[ { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334941_664715290402166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is backpack (annotated by the red box) located relative to bicycle? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669876_10407333805500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, screen door (highlighted by a red box) or tap (highlighted by a blue box)?\n(A) screen door\n(B) tap" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897467_471489824628958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, swivel chair (highlighted by a red box) or table (highlighted by a blue box)?\n(A) swivel chair\n(B) table" }, { "from": "gpt", "value": "(A) swivel chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204329_14347614919083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, table (highlighted by a red box) or clothing (highlighted by a blue box)?\n(A) table\n(B) clothing" }, { "from": "gpt", "value": "(B) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739814_15631651549416_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from window (highlighted by a red box), window (highlighted by a blue box) or door (highlighted by a green box)?\n(A) window\n(B) door" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458260_74262343943791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, screen door (highlighted by a red box) or window screen (highlighted by a blue box)?\n(A) screen door\n(B) window screen" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430808_64038305991166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, screen door (highlighted by a red box) or toilet bowl (highlighted by a blue box)?\n(A) screen door\n(B) toilet bowl" }, { "from": "gpt", "value": "(B) toilet bowl" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331942_164661724079708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, desk (highlighted by a red box) or box (highlighted by a blue box)?\n(A) desk\n(B) box" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018608_633244509572500_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, box (highlighted by a red box) or window (highlighted by a blue box)?\n(A) box\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333864_75489546159000_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears farthest from the camera in this image?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261651_1363022573958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, picture frame (highlighted by a red box) or window (highlighted by a blue box)?\n(A) picture frame\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739459_51775592542583_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from furniture (highlighted by a red box)? Choose from table (highlighted by a blue box) and curtain (highlighted by a green box).\n(A) table\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896063_132127003219790_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, chair (highlighted by a red box) or refrigerator (highlighted by a blue box)?\n(A) chair\n(B) refrigerator" }, { "from": "gpt", "value": "(B) refrigerator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331133_175752029265625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, sink (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) sink\n(B) basket" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896097_145219901080208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899491_197775653956166_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from feeding chair (highlighted by a red box)? Choose among these: window frame (highlighted by a blue box) or chair (highlighted by a green box).\n(A) window frame\n(B) chair" }, { "from": "gpt", "value": "(A) window frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115412_4206760563125_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896512_33388267552791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to picture frame (highlighted by a red box), furniture (highlighted by a blue box) or table (highlighted by a green box)?\n(A) furniture\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332198_263703248723000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to bath mat (highlighted by a red box)? faucet (highlighted by a blue box) or sink (highlighted by a green box).\n(A) faucet\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899654_233422276583583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, studio couch (highlighted by a red box) or couch (highlighted by a blue box)?\n(A) studio couch\n(B) couch" }, { "from": "gpt", "value": "(B) couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898506_160850790415583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to book (highlighted by a red box), book (highlighted by a blue box) or desk (highlighted by a green box)?\n(A) book\n(B) desk" }, { "from": "gpt", "value": "(B) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333040_59756264967250_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from table (highlighted by a red box)? chair (highlighted by a blue box) or bottle (highlighted by a green box)?\n(A) chair\n(B) bottle" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018445_526692195914124_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899900_1026974032554208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, table lamp (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) table lamp\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333803_51498852317750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, chair (highlighted by a red box) or plate (highlighted by a blue box)?\n(A) chair\n(B) plate" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670184_51698634192875_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332473_886556167155125_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261241_15104204634750_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to character sculpture (highlighted by a red box)? Choose from character sculpture (highlighted by a blue box) and character sculpture (highlighted by a green box).\n(A) character sculpture\n(B) character sculpture" }, { "from": "gpt", "value": "(B) character sculpture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018634_635970678016333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895196_39143428956375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, table lamp (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) table lamp\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204363_15902923166041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, footwear (highlighted by a red box) or footwear (highlighted by a blue box)?\n(A) footwear\n(B) footwear" }, { "from": "gpt", "value": "(A) footwear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897924_348987844541458_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446061_80599078323125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, path (highlighted by a red box) or door (highlighted by a blue box)?\n(A) path\n(B) door" }, { "from": "gpt", "value": "(A) path" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899340_714909045739125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, round table (highlighted by a red box) or plywood (highlighted by a blue box)?\n(A) round table\n(B) plywood" }, { "from": "gpt", "value": "(A) round table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429955_140614378507333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the sink (highlighted by a red box)? toothbrush (highlighted by a blue box) or bathroom cabinet (highlighted by a green box).\n(A) toothbrush\n(B) bathroom cabinet" }, { "from": "gpt", "value": "(B) bathroom cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444696_72540776745250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, cabinetry (highlighted by a red box) or faucet (highlighted by a blue box)?\n(A) cabinetry\n(B) faucet" }, { "from": "gpt", "value": "(B) faucet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458582_1554874526458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, porcelain (highlighted by a red box) or tap (highlighted by a blue box)?\n(A) porcelain\n(B) tap" }, { "from": "gpt", "value": "(A) porcelain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333153_41544319346000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to toy (highlighted by a red box), changing table (highlighted by a blue box) or blanket (highlighted by a green box)?\n(A) changing table\n(B) blanket" }, { "from": "gpt", "value": "(A) changing table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115238_97780883819375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, curtain (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) curtain\n(B) picture frame" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332818_48818807294083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, curtain (highlighted by a red box) or doormat (highlighted by a blue box)?\n(A) curtain\n(B) doormat" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898021_220937136230541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to curtain (highlighted by a red box)? Select from window (highlighted by a blue box) and chair (highlighted by a green box).\n(A) window\n(B) chair" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796590_17466475792500_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, shower (highlighted by a red box) or ceramic tile (highlighted by a blue box)?\n(A) shower\n(B) ceramic tile" }, { "from": "gpt", "value": "(B) ceramic tile" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261695_603741524083_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to window (highlighted by a red box)? Choose from lamp (highlighted by a blue box) and lamp (highlighted by a green box).\n(A) lamp\n(B) lamp" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115131_85648145804375_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from door (highlighted by a red box)? faucet (highlighted by a blue box) or toilet (highlighted by a green box)?\n(A) faucet\n(B) toilet" }, { "from": "gpt", "value": "(B) toilet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896188_141845428118916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, garage door (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) garage door\n(B) screen door" }, { "from": "gpt", "value": "(A) garage door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895298_91095138433541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, picture frame (highlighted by a red box) or television (highlighted by a blue box)?\n(A) picture frame\n(B) television" }, { "from": "gpt", "value": "(B) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899268_883878195961791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, mirror (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) mirror\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898710_581484814994416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from elevator (highlighted by a red box)? Choose from elevator (highlighted by a blue box) and light fixture (highlighted by a green box).\n(A) elevator\n(B) light fixture" }, { "from": "gpt", "value": "(B) light fixture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332624_365537390733375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, person (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) person\n(B) picture frame" }, { "from": "gpt", "value": "(A) person" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739635_2290152125708_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to toiletry (highlighted by a red box)? Choose from bath (highlighted by a blue box) and toilet (highlighted by a green box).\n(A) bath\n(B) toilet" }, { "from": "gpt", "value": "(A) bath" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458337_102896725512250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, mat (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) mat\n(B) pillow" }, { "from": "gpt", "value": "(A) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649464_13883129043666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from book (highlighted by a red box)? Select from book (highlighted by a blue box) and bookcase (highlighted by a green box).\n(A) book\n(B) bookcase" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331910_627584769701250_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331423_544269119624875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of chair (annotated by the red box) in reference to chair?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828324_77735878053500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, nightstand (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) nightstand\n(B) furniture" }, { "from": "gpt", "value": "(A) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333144_40436725573291_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to poster page (highlighted by a red box)? national flag (highlighted by a blue box) or art (highlighted by a green box).\n(A) national flag\n(B) art" }, { "from": "gpt", "value": "(B) art" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261219_13518815624916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, window (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) window\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331279_14312486262791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhere is shelf (annotated by the red box) located in relation to cabinet in the image?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895249_75852191542416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899285_885255565239875_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the doormat (highlighted by a red box)? Choose among these: gas stove (highlighted by a blue box) or stainless steel (highlighted by a green box).\n(A) gas stove\n(B) stainless steel" }, { "from": "gpt", "value": "(A) gas stove" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334935_663090898567166_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from coffee cup (highlighted by a red box)? chair (highlighted by a blue box) or houseplant (highlighted by a green box)?\n(A) chair\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332487_341136086468708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to sink (highlighted by a red box)? Choose from bathroom cabinet (highlighted by a blue box) and mirror (highlighted by a green box).\n(A) bathroom cabinet\n(B) mirror" }, { "from": "gpt", "value": "(A) bathroom cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115201_94448150995500_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from door (highlighted by a red box)? Choose among these: laundry (highlighted by a blue box) or screen door (highlighted by a green box).\n(A) laundry\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331378_198321087220916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, window (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) window\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796326_16169071316458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chest of drawers (highlighted by a red box) or ladder (highlighted by a blue box)?\n(A) chest of drawers\n(B) ladder" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796562_15954475119250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, picture frame (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) picture frame\n(B) radiator" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796475_4284932749708_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from hat (highlighted by a red box)? Choose from toy (highlighted by a blue box) and book (highlighted by a green box).\n(A) toy\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447210_209184258853333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to screen door (highlighted by a red box)? Choose from sink (highlighted by a blue box) and swivel chair (highlighted by a green box).\n(A) sink\n(B) swivel chair" }, { "from": "gpt", "value": "(B) swivel chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204362_15639125119916_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the picture frame (highlighted by a red box)? picture frame (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018608_633226516936833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, window (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) window\n(B) chair" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898350_511456770530916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from window (highlighted by a red box), wall clock (highlighted by a blue box) or curtain (highlighted by a green box)?\n(A) wall clock\n(B) curtain" }, { "from": "gpt", "value": "(A) wall clock" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899209_186753380119125_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to table (highlighted by a red box), curtain (highlighted by a blue box) or table (highlighted by a green box)?\n(A) curtain\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828478_100710750317666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, appliance (highlighted by a red box) or sink (highlighted by a blue box)?\n(A) appliance\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895949_109112715628375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from mug (highlighted by a red box)? stool (highlighted by a blue box) or sink (highlighted by a green box)?\n(A) stool\n(B) sink" }, { "from": "gpt", "value": "(A) stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447294_409050904206583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, door (highlighted by a red box) or magazine (highlighted by a blue box)?\n(A) door\n(B) magazine" }, { "from": "gpt", "value": "(B) magazine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898701_580949994578625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of picture frame (annotated by the red box) in reference to picture frame?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429773_359932729415958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, bed (highlighted by a red box) or nightstand (highlighted by a blue box)?\n(A) bed\n(B) nightstand" }, { "from": "gpt", "value": "(B) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204920_3744890830750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, furniture (highlighted by a red box) or television (highlighted by a blue box)?\n(A) furniture\n(B) television" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663349_91098008814333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, shutter (highlighted by a red box) or door (highlighted by a blue box)?\n(A) shutter\n(B) door" }, { "from": "gpt", "value": "(A) shutter" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261527_45656748560250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, studio couch (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669851_12519852058708_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204876_3594336259125_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to toilet (highlighted by a red box), radiator (highlighted by a blue box) or sink (highlighted by a green box)?\n(A) radiator\n(B) sink" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895478_134511723182333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, table (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) table\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458556_128064016650208_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to shoe (highlighted by a red box)? Choose from radiator (highlighted by a blue box) and door (highlighted by a green box).\n(A) radiator\n(B) door" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333847_74947820091666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, ipad (highlighted by a red box) or round table (highlighted by a blue box)?\n(A) ipad\n(B) round table" }, { "from": "gpt", "value": "(B) round table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898899_816930734488916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is toilet paper (annotated by the red box) located in relation to toilet paper in the image? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332810_48204821937708_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, window (highlighted by a red box) or steering wheel (highlighted by a blue box)?\n(A) window\n(B) steering wheel" }, { "from": "gpt", "value": "(B) steering wheel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649720_48008953158000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, sink (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) sink\n(B) appliance" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458262_74209148303666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to clothesline (highlighted by a red box), trousers (highlighted by a blue box) or closet (highlighted by a green box)?\n(A) trousers\n(B) closet" }, { "from": "gpt", "value": "(B) closet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333244_33497304154500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, movie poster (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) movie poster\n(B) picture frame" }, { "from": "gpt", "value": "(A) movie poster" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796576_16728864072458_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, nightstand (highlighted by a red box) or tap (highlighted by a blue box)?\n(A) nightstand\n(B) tap" }, { "from": "gpt", "value": "(B) tap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115217_94942733022083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, appliance (highlighted by a red box) or door (highlighted by a blue box)?\n(A) appliance\n(B) door" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445590_284245041480000_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204747_25286687661333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to window sill (highlighted by a red box), mantle (highlighted by a blue box) or studio couch (highlighted by a green box)?\n(A) mantle\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649743_49747900717250_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to picture frame (highlighted by a red box)? picture frame (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261686_3789953013041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to pillow (highlighted by a red box)? Choose from pillow (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) pillow\n(B) picture frame" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334471_102415951779958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, curtain (highlighted by a red box) or bay window (highlighted by a blue box)?\n(A) curtain\n(B) bay window" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358328_19187072574208_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333134_39246870209416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of footwear (annotated by the red box) and footwear in the image provided, where is footwear (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669980_28888794651375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to swivel chair (highlighted by a red box)? Choose from bunk bed (highlighted by a blue box) and table (highlighted by a green box).\n(A) bunk bed\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897890_345033712360000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, poster page (highlighted by a red box) or computer monitor (highlighted by a blue box)?\n(A) poster page\n(B) computer monitor" }, { "from": "gpt", "value": "(A) poster page" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899900_1026934032296666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, storage box (highlighted by a red box) or storage box (highlighted by a blue box)?\n(A) storage box\n(B) storage box" }, { "from": "gpt", "value": "(A) storage box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896484_23842704080708_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, pillow (highlighted by a red box) or window (highlighted by a blue box)?\n(A) pillow\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261645_583098749208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, pillow (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) pillow\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898024_220862732854166_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898510_160667699681375_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from radiator (highlighted by a red box)? Choose from mirror (highlighted by a blue box) and door (highlighted by a green box).\n(A) mirror\n(B) door" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446488_356811850527291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, countertop (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) countertop\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828311_76536540516625_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from bench (highlighted by a red box)? Select from table (highlighted by a blue box) and rail (highlighted by a green box).\n(A) table\n(B) rail" }, { "from": "gpt", "value": "(B) rail" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796507_3197608214541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, door (highlighted by a red box) or door (highlighted by a blue box)?\n(A) door\n(B) door" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649802_46909288861083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is studio couch (annotated by the red box) located in relation to pillow in the image? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429771_360051930924166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, picture frame (highlighted by a red box) or vase (highlighted by a blue box)?\n(A) picture frame\n(B) vase" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899284_885322354157458_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the cloth (highlighted by a red box)? kitchen appliance (highlighted by a blue box) or cutting board (highlighted by a green box).\n(A) kitchen appliance\n(B) cutting board" }, { "from": "gpt", "value": "(B) cutting board" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334267_156726272958916_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to plant (highlighted by a red box)? Select from table (highlighted by a blue box) and air conditioning (highlighted by a green box).\n(A) table\n(B) air conditioning" }, { "from": "gpt", "value": "(B) air conditioning" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649729_48930818639708_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, window frame (highlighted by a red box) or bay window (highlighted by a blue box)?\n(A) window frame\n(B) bay window" }, { "from": "gpt", "value": "(A) window frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446485_355962350082958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, plant (highlighted by a red box) or table (highlighted by a blue box)?\n(A) plant\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446466_355354448437166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, houseplant (highlighted by a red box) or table (highlighted by a blue box)?\n(A) houseplant\n(B) table" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796744_28934075989666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of desk (annotated by the red box) in relation to jug?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796438_680618071583_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, mirror (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) mirror\n(B) cabinetry" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828320_76241740437500_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the swivel chair (highlighted by a red box)? Choose among these: coffee table (highlighted by a blue box) or bench (highlighted by a green box).\n(A) coffee table\n(B) bench" }, { "from": "gpt", "value": "(B) bench" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018778_15481587237708_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to mouthwash (highlighted by a red box)? toilet paper (highlighted by a blue box) or brush (highlighted by a green box).\n(A) toilet paper\n(B) brush" }, { "from": "gpt", "value": "(A) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261381_26864120546958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, screen door (highlighted by a red box) or stationary bicycle (highlighted by a blue box)?\n(A) screen door\n(B) stationary bicycle" }, { "from": "gpt", "value": "(B) stationary bicycle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897818_132724688336250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, material (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) material\n(B) pillow" }, { "from": "gpt", "value": "(A) material" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446444_82601013538833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, picture frame (highlighted by a red box) or window frame (highlighted by a blue box)?\n(A) picture frame\n(B) window frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669960_27593090502708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from cabinetry (highlighted by a red box)? faucet (highlighted by a blue box) or silver (highlighted by a green box)?\n(A) faucet\n(B) silver" }, { "from": "gpt", "value": "(A) faucet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899913_1028269563483333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from tap (highlighted by a red box), light fixture (highlighted by a blue box) or toiletry (highlighted by a green box)?\n(A) light fixture\n(B) toiletry" }, { "from": "gpt", "value": "(A) light fixture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204342_14939703565166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chair (highlighted by a red box) or power outlet (highlighted by a blue box)?\n(A) chair\n(B) power outlet" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898386_367846505848833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, box (highlighted by a red box) or box (highlighted by a blue box)?\n(A) box\n(B) box" }, { "from": "gpt", "value": "(A) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261688_334447994208_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to tap (highlighted by a red box), table (highlighted by a blue box) or wine bottle (highlighted by a green box)?\n(A) table\n(B) wine bottle" }, { "from": "gpt", "value": "(B) wine bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898454_156503094763583_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, shoe (highlighted by a red box) or footwear (highlighted by a blue box)?\n(A) shoe\n(B) footwear" }, { "from": "gpt", "value": "(B) footwear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331911_629257990039875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, curtain (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) curtain\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333647_126142819829750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, home appliance (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) home appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(A) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670224_53959173180625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, appliance (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) appliance\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358731_6769824391375_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897818_132710693876750_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from lamp (highlighted by a red box)? table lamp (highlighted by a blue box) or toy (highlighted by a green box)?\n(A) table lamp\n(B) toy" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739417_191293470621166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chair (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) chair\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018188_466683046361291_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897410_103101781642708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, appliance (highlighted by a red box) or socket (highlighted by a blue box)?\n(A) appliance\n(B) socket" }, { "from": "gpt", "value": "(B) socket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899905_1027815756372750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, book (highlighted by a red box) or vanity (highlighted by a blue box)?\n(A) book\n(B) vanity" }, { "from": "gpt", "value": "(B) vanity" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429773_359926731849125_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from plant (highlighted by a red box)? Choose from window box (highlighted by a blue box) and curtain (highlighted by a green box).\n(A) window box\n(B) curtain" }, { "from": "gpt", "value": "(A) window box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260957_5982300032291_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to radiator (highlighted by a red box)? Choose from door (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) door\n(B) picture frame" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204363_15796831823000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, furniture (highlighted by a red box) or footwear (highlighted by a blue box)?\n(A) furniture\n(B) footwear" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333873_76309370298916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, vanity (highlighted by a red box) or bean bag chair (highlighted by a blue box)?\n(A) vanity\n(B) bean bag chair" }, { "from": "gpt", "value": "(A) vanity" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018331_116067108941416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, droplight (highlighted by a red box) or droplight (highlighted by a blue box)?\n(A) droplight\n(B) droplight" }, { "from": "gpt", "value": "(A) droplight" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358281_9125518665916_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to picture frame (highlighted by a red box)? appliance (highlighted by a blue box) or countertop (highlighted by a green box).\n(A) appliance\n(B) countertop" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261219_13588819904625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, vent (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) vent\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897951_533548622952625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, bottle (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) bottle\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896365_19899848797625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, window screen (highlighted by a red box) or waste container (highlighted by a blue box)?\n(A) window screen\n(B) waste container" }, { "from": "gpt", "value": "(A) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896589_33011542384208_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to radiator (highlighted by a red box)? Choose from furniture (highlighted by a blue box) and table (highlighted by a green box).\n(A) furniture\n(B) table" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333319_28455150099958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, houseplant (highlighted by a red box) or flower (highlighted by a blue box)?\n(A) houseplant\n(B) flower" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115416_4035761517333_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, picture frame (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) picture frame\n(B) pillow" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649754_51826238707500_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, window (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) window\n(B) window sill" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895191_38690525979583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, box (highlighted by a red box) or box (highlighted by a blue box)?\n(A) box\n(B) box" }, { "from": "gpt", "value": "(A) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358418_41217909488583_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, furniture (highlighted by a red box) or footwear (highlighted by a blue box)?\n(A) furniture\n(B) footwear" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445594_285327533401833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to stairwell (highlighted by a red box), concrete (highlighted by a blue box) or door (highlighted by a green box)?\n(A) concrete\n(B) door" }, { "from": "gpt", "value": "(A) concrete" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018412_394255532239083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to appliance (highlighted by a red box)? home appliance (highlighted by a blue box) or sink (highlighted by a green box).\n(A) home appliance\n(B) sink" }, { "from": "gpt", "value": "(A) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430550_301270051765958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, picture frame (highlighted by a red box) or plant (highlighted by a blue box)?\n(A) picture frame\n(B) plant" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739678_765816663625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, chair (highlighted by a red box) or concrete (highlighted by a blue box)?\n(A) chair\n(B) concrete" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332207_264482478637333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from refrigerator (highlighted by a red box), box (highlighted by a blue box) or bottle (highlighted by a green box)?\n(A) box\n(B) bottle" }, { "from": "gpt", "value": "(A) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333846_74844728501958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to mat (highlighted by a red box)? Select from studio couch (highlighted by a blue box) and tablet computer (highlighted by a green box).\n(A) studio couch\n(B) tablet computer" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429729_18975038092041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from chest of drawers (highlighted by a red box), bag (highlighted by a blue box) or table (highlighted by a green box)?\n(A) bag\n(B) table" }, { "from": "gpt", "value": "(A) bag" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115422_4833902816083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, bathtub (highlighted by a red box) or bath towel (highlighted by a blue box)?\n(A) bathtub\n(B) bath towel" }, { "from": "gpt", "value": "(A) bathtub" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896089_143910090447208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of studio couch (annotated by the red box) in reference to houseplant? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445444_149642016650833_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to toilet (highlighted by a red box)? potty (highlighted by a blue box) or screen door (highlighted by a green box).\n(A) potty\n(B) screen door" }, { "from": "gpt", "value": "(A) potty" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895818_685950429661791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to sink (highlighted by a red box), bathtub (highlighted by a blue box) or counter top (highlighted by a green box)?\n(A) bathtub\n(B) counter top" }, { "from": "gpt", "value": "(B) counter top" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898655_572939329924708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from picture frame (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and table lamp (highlighted by a green box).\n(A) picture frame\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333264_21839814114916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, appliance (highlighted by a red box) or food (highlighted by a blue box)?\n(A) appliance\n(B) food" }, { "from": "gpt", "value": "(B) food" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897426_104144218189500_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, door (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) door\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331107_135508972846666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from alphabet (highlighted by a red box)? Choose from alphabet (highlighted by a blue box) and door (highlighted by a green box).\n(A) alphabet\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895865_107704968196875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is picture frame (annotated by the red box) located in relation to oil lamp in the image? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115158_87720192326125_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from bed (highlighted by a red box)? sleeping bag (highlighted by a blue box) or blanket (highlighted by a green box)?\n(A) sleeping bag\n(B) blanket" }, { "from": "gpt", "value": "(A) sleeping bag" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018846_649974406871416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, chair (highlighted by a red box) or table (highlighted by a blue box)?\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333674_134265756341583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of chest of drawers (annotated by the red box) in relation to clothing? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444588_31787296168166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from electric outlet (highlighted by a red box), appliance (highlighted by a blue box) or furniture (highlighted by a green box)?\n(A) appliance\n(B) furniture" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333876_77234369359666_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, bulletin board (highlighted by a red box) or glass door (highlighted by a blue box)?\n(A) bulletin board\n(B) glass door" }, { "from": "gpt", "value": "(B) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828552_101484719665000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the clock (highlighted by a red box)? curtain (highlighted by a blue box) or lamp (highlighted by a green box).\n(A) curtain\n(B) lamp" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332201_264258269564416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chair (highlighted by a red box) or fireplace (highlighted by a blue box)?\n(A) chair\n(B) fireplace" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429725_19060936533666_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430904_80941269752083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, refrigerator (highlighted by a red box) or faucet (highlighted by a blue box)?\n(A) refrigerator\n(B) faucet" }, { "from": "gpt", "value": "(A) refrigerator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898720_582946477058291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, nightstand (highlighted by a red box) or bedside lamp (highlighted by a blue box)?\n(A) nightstand\n(B) bedside lamp" }, { "from": "gpt", "value": "(B) bedside lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444706_73274572025250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, light switch (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) light switch\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796691_30636344626500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from home appliance (highlighted by a red box), table (highlighted by a blue box) or clock (highlighted by a green box)?\n(A) table\n(B) clock" }, { "from": "gpt", "value": "(B) clock" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333203_46894940570375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of table (annotated by the red box) in relation to cabinetry?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896510_33451374766000_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to window (highlighted by a red box)? Select from television (highlighted by a blue box) and speaker (highlighted by a green box).\n(A) television\n(B) speaker" }, { "from": "gpt", "value": "(A) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115143_87168971391916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, desk (highlighted by a red box) or desk (highlighted by a blue box)?\n(A) desk\n(B) desk" }, { "from": "gpt", "value": "(B) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662806_13586892413708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the bed (highlighted by a red box)? Choose among these: shelf (highlighted by a blue box) or bicycle (highlighted by a green box).\n(A) shelf\n(B) bicycle" }, { "from": "gpt", "value": "(B) bicycle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895298_91147134009875_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the furniture (highlighted by a red box)? sheet (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) sheet\n(B) pillow" }, { "from": "gpt", "value": "(A) sheet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334756_421314502120791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhere is window (annotated by the red box) located in relation to window in the image?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430904_80937271371791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from glass jar (highlighted by a red box)? Select from houseplant (highlighted by a blue box) and gift bag (highlighted by a green box).\n(A) houseplant\n(B) gift bag" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446479_355568761064958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, table lamp (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) table lamp\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430246_182449585670250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47431081_75434125945375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, curtain (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) curtain\n(B) shelf" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897712_112163298325333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the vent (highlighted by a red box)? cabinetry (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) cabinetry\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358220_9340055997458_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to table (highlighted by a red box)? Choose from door (highlighted by a blue box) and barn door (highlighted by a green box).\n(A) door\n(B) barn door" }, { "from": "gpt", "value": "(B) barn door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895258_78319980748208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chest of drawers (highlighted by a red box) or potty (highlighted by a blue box)?\n(A) chest of drawers\n(B) potty" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898195_145242924021041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, picture frame (highlighted by a red box) or air conditioning (highlighted by a blue box)?\n(A) picture frame\n(B) air conditioning" }, { "from": "gpt", "value": "(B) air conditioning" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204330_14301816367541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from plant (highlighted by a red box)? Choose among these: chest of drawers (highlighted by a blue box) or basket container (highlighted by a green box).\n(A) chest of drawers\n(B) basket container" }, { "from": "gpt", "value": "(B) basket container" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896304_6848147630916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, refrigerator (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) refrigerator\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895279_79295911350416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, furniture (highlighted by a red box) or blanket (highlighted by a blue box)?\n(A) furniture\n(B) blanket" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458286_76250043444208_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from pillow (highlighted by a red box)? Choose from curtain (highlighted by a blue box) and studio couch (highlighted by a green box).\n(A) curtain\n(B) studio couch" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444751_79721867378000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, kitchen appliance (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) kitchen appliance\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447308_409784180742166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, door (highlighted by a red box) or doormat (highlighted by a blue box)?\n(A) door\n(B) doormat" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458617_127177967994083_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332808_47989326649333_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, table (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) table\n(B) screen door" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332234_755719322214416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, drawer (highlighted by a red box) or soap (highlighted by a blue box)?\n(A) drawer\n(B) soap" }, { "from": "gpt", "value": "(A) drawer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018153_373375673993708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, paper towel (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) paper towel\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897509_472288409528791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, box (highlighted by a red box) or box (highlighted by a blue box)?\n(A) box\n(B) box" }, { "from": "gpt", "value": "(B) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430934_94934532499750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, home appliance (highlighted by a red box) or glass door (highlighted by a blue box)?\n(A) home appliance\n(B) glass door" }, { "from": "gpt", "value": "(A) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796498_1572072132666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, table (highlighted by a red box) or clothing (highlighted by a blue box)?\n(A) table\n(B) clothing" }, { "from": "gpt", "value": "(B) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898958_821359296220208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, electric outlet (highlighted by a red box) or window (highlighted by a blue box)?\n(A) electric outlet\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828478_100806743862333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, picture frame (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) picture frame\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445168_8044525714333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from radiator (highlighted by a red box)? Choose from furniture (highlighted by a blue box) and plain (highlighted by a green box).\n(A) furniture\n(B) plain" }, { "from": "gpt", "value": "(B) plain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430221_180193406447250_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to computer (highlighted by a red box)? Select from computer monitor (highlighted by a blue box) and picnic basket (highlighted by a green box).\n(A) computer monitor\n(B) picnic basket" }, { "from": "gpt", "value": "(A) computer monitor" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47431030_141402953276541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, bath (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) bath\n(B) toiletry" }, { "from": "gpt", "value": "(B) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332473_886550169576000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from window (highlighted by a red box)? man (highlighted by a blue box) or curtain (highlighted by a green box)?\n(A) man\n(B) curtain" }, { "from": "gpt", "value": "(A) man" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444758_80913768584083_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from chest of drawers (highlighted by a red box), laundry basket (highlighted by a blue box) or lamp (highlighted by a green box)?\n(A) laundry basket\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261490_41852358166333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the studio couch (highlighted by a red box)? Choose among these: pillow (highlighted by a blue box) or curtain (highlighted by a green box).\n(A) pillow\n(B) curtain" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445168_7922524287958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, studio couch (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) studio couch\n(B) chair" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445676_60892216921041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, table (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) table\n(B) curtain" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899642_231988183451250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, bed (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) bed\n(B) curtain" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796576_16754869974458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chest of drawers (highlighted by a red box) or mirror (highlighted by a blue box)?\n(A) chest of drawers\n(B) mirror" }, { "from": "gpt", "value": "(B) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649798_46152504935333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, wood burning stove (highlighted by a red box) or table (highlighted by a blue box)?\n(A) wood burning stove\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260946_4659884926458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, television (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) television\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331934_163587793997208_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to kitchen appliance (highlighted by a red box)? place mat (highlighted by a blue box) or appliance (highlighted by a green box).\n(A) place mat\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331103_135820879684166_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796230_2582611848625_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, screen door (highlighted by a red box) or music stool (highlighted by a blue box)?\n(A) screen door\n(B) music stool" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899898_1027094732969666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, dog (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) dog\n(B) pillow" }, { "from": "gpt", "value": "(A) dog" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018540_828192642665416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, picture frame (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) picture frame\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429861_13403545910208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898785_67268202401582_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, picture frame (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) picture frame\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446466_355424453253958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to shelf (highlighted by a red box)? swivel chair (highlighted by a blue box) or studio couch (highlighted by a green box).\n(A) swivel chair\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204863_2720948579541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, window (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) window\n(B) curtain" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895574_1153859235153166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of gas stove (annotated by the red box) and paper towel in the image provided, where is gas stove (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649707_47753759310875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to computer monitor (highlighted by a red box)? Select from clothing (highlighted by a blue box) and clothing (highlighted by a green box).\n(A) clothing\n(B) clothing" }, { "from": "gpt", "value": "(B) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204296_14327601456458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, glass door (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) glass door\n(B) cabinetry" }, { "from": "gpt", "value": "(A) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828562_102288772541125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, studio couch (highlighted by a red box) or glass door (highlighted by a blue box)?\n(A) studio couch\n(B) glass door" }, { "from": "gpt", "value": "(B) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333581_207632035047166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, chair (highlighted by a red box) or table (highlighted by a blue box)?\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649720_47924954824500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, tv show (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) tv show\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896133_147098726105708_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331041_479800421355916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, door (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) door\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445619_56368403184416_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from bulletin board (highlighted by a red box)? round table (highlighted by a blue box) or box (highlighted by a green box)?\n(A) round table\n(B) box" }, { "from": "gpt", "value": "(A) round table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897490_471260819786416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of chair (annotated by the red box) in reference to chair? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897467_471547817156125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, chair (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) chair\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261265_13772009938125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, screen door (highlighted by a red box) or plumbing fixture (highlighted by a blue box)?\n(A) screen door\n(B) plumbing fixture" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204350_15552026235791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, picture frame (highlighted by a red box) or table (highlighted by a blue box)?\n(A) picture frame\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332398_401509407893375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, cardboard box (highlighted by a red box) or magazine (highlighted by a blue box)?\n(A) cardboard box\n(B) magazine" }, { "from": "gpt", "value": "(A) cardboard box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334185_354524273540208_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897490_471178220689791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from kitchen appliance (highlighted by a red box)? Choose among these: appliance (highlighted by a blue box) or bottle (highlighted by a green box).\n(A) appliance\n(B) bottle" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458617_127145764065875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, window (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) window\n(B) screen door" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895826_1219987677093208_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from window frame (highlighted by a red box), curtain (highlighted by a blue box) or window sill (highlighted by a green box)?\n(A) curtain\n(B) window sill" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670208_54105662258041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from swivel chair (highlighted by a red box)? clock (highlighted by a blue box) or shelf (highlighted by a green box)?\n(A) clock\n(B) shelf" }, { "from": "gpt", "value": "(A) clock" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334487_104538619995041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is backpack (annotated by the red box) located in relation to backpack in the image? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358673_859094786875_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to picture frame (highlighted by a red box)? Select from window (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) window\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261317_23577486069875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, furniture (highlighted by a red box) or television (highlighted by a blue box)?\n(A) furniture\n(B) television" }, { "from": "gpt", "value": "(B) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334628_386189939950416_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from toy (highlighted by a red box)? toy (highlighted by a blue box) or toy (highlighted by a green box)?\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331421_544149117838958_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is door (annotated by the red box) located in relation to bird cage in the image? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445040_1761440344666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to pillow (highlighted by a red box)? Select from pillow (highlighted by a blue box) and shelf (highlighted by a green box).\n(A) pillow\n(B) shelf" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896042_130075251986833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, sink (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) sink\n(B) radiator" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895987_136432102599166_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from book (highlighted by a red box), book (highlighted by a blue box) or book (highlighted by a green box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204763_26823597003416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, chair (highlighted by a red box) or computer monitor (highlighted by a blue box)?\n(A) chair\n(B) computer monitor" }, { "from": "gpt", "value": "(B) computer monitor" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333159_41488625271541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the cabinetry (highlighted by a red box)? toy (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) toy\n(B) cabinetry" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333277_24365800424458_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from table (highlighted by a red box)? plywood (highlighted by a blue box) or table (highlighted by a green box)?\n(A) plywood\n(B) table" }, { "from": "gpt", "value": "(A) plywood" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334184_354638660817250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, desk (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) desk\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899364_717510400360791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, electric outlet (highlighted by a red box) or door (highlighted by a blue box)?\n(A) electric outlet\n(B) door" }, { "from": "gpt", "value": "(A) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333275_24607501349458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chair (highlighted by a red box) or table (highlighted by a blue box)?\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446485_355718349965125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of chair (annotated by the red box) in reference to table? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897478_112701148976958_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to chair (highlighted by a red box)? Select from cabinetry (highlighted by a blue box) and paperback book (highlighted by a green box).\n(A) cabinetry\n(B) paperback book" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204730_23386626873750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is curtain (annotated by the red box) located in relation to window in the image? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358162_60962728974583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the pillow (highlighted by a red box)? glass door (highlighted by a blue box) or side (highlighted by a green box).\n(A) glass door\n(B) side" }, { "from": "gpt", "value": "(B) side" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895947_109047024958375_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from shelf (highlighted by a red box)? bottle (highlighted by a blue box) or soap dispenser (highlighted by a green box)?\n(A) bottle\n(B) soap dispenser" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331347_192476518816375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, bookcase (highlighted by a red box) or table (highlighted by a blue box)?\n(A) bookcase\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334025_271612801946958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of refrigerator (annotated by the red box) in reference to home appliance? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429826_746664794645666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to shower (highlighted by a red box), shower (highlighted by a blue box) or radiator (highlighted by a green box)?\n(A) shower\n(B) radiator" }, { "from": "gpt", "value": "(A) shower" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828449_91281235492291_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from coffee table (highlighted by a red box), pillow (highlighted by a blue box) or fireplace (highlighted by a green box)?\n(A) pillow\n(B) fireplace" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331498_153782315380541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, bathroom cabinet (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) bathroom cabinet\n(B) toiletry" }, { "from": "gpt", "value": "(A) bathroom cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649714_47832643224208_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from door (highlighted by a red box)? radiator (highlighted by a blue box) or shelf (highlighted by a green box)?\n(A) radiator\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018808_19351785104541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of armchair (annotated by the red box) in relation to poster? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115150_86905080628458_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from mirror (highlighted by a red box)? window (highlighted by a blue box) or window (highlighted by a green box)?\n(A) window\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897436_104954930572083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, mirror (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) mirror\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332113_684352005194833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, washing machine (highlighted by a red box) or bath towel (highlighted by a blue box)?\n(A) washing machine\n(B) bath towel" }, { "from": "gpt", "value": "(B) bath towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358707_5112460823250_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from basket (highlighted by a red box)? Select from picture frame (highlighted by a blue box) and toilet paper (highlighted by a green box).\n(A) picture frame\n(B) toilet paper" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898419_1191040967625_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to window sill (highlighted by a red box), curtain (highlighted by a blue box) or fireplace (highlighted by a green box)?\n(A) curtain\n(B) fireplace" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331928_163303192367416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, studio couch (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) studio couch\n(B) chair" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430236_181785972249333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, washing machine (highlighted by a red box) or cleaning product (highlighted by a blue box)?\n(A) washing machine\n(B) cleaning product" }, { "from": "gpt", "value": "(A) washing machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333014_130219113721041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from book (highlighted by a red box)? Choose among these: book (highlighted by a blue box) or book (highlighted by a green box).\n(A) book\n(B) book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331772_8590805929083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, furniture (highlighted by a red box) or table (highlighted by a blue box)?\n(A) furniture\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430928_92988182912875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, door (highlighted by a red box) or plywood (highlighted by a blue box)?\n(A) door\n(B) plywood" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649459_13942039068916_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from studio couch (highlighted by a red box), book (highlighted by a blue box) or book (highlighted by a green box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899664_234643767857458_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from window sill (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) picture frame\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018844_649819320061916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, plant (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) plant\n(B) shelf" }, { "from": "gpt", "value": "(A) plant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018757_14936952527041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, houseplant (highlighted by a red box) or door (highlighted by a blue box)?\n(A) houseplant\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333268_22012310501750_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, furniture (highlighted by a red box) or fridge (highlighted by a blue box)?\n(A) furniture\n(B) fridge" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333329_30162824315708_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828311_76502537297916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of furniture (annotated by the red box) in relation to clothing?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018758_15011355826666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from exhaust hood (highlighted by a red box), table (highlighted by a blue box) or cabinetry (highlighted by a green box)?\n(A) table\n(B) cabinetry" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649727_49019315230875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, door (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) door\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458756_141614941673291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the stationery (highlighted by a red box)? door (highlighted by a blue box) or houseplant (highlighted by a green box).\n(A) door\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670002_29870063539916_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from basket (highlighted by a red box)? Choose from cabinetry (highlighted by a blue box) and window (highlighted by a green box).\n(A) cabinetry\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447287_408764605859208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, gas stove (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) gas stove\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331921_630922094010041_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333233_32452270550416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, toy (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) toy\n(B) bottle" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896187_141971128374500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, scale (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) scale\n(B) basket" }, { "from": "gpt", "value": "(B) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358230_10054362442916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, book (highlighted by a red box) or writing (highlighted by a blue box)?\n(A) book\n(B) writing" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334628_386176645336166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, screen door (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) screen door\n(B) lamp" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899046_645848000323791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to oval (highlighted by a red box)? screen door (highlighted by a blue box) or box (highlighted by a green box).\n(A) screen door\n(B) box" }, { "from": "gpt", "value": "(B) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898247_167676829301500_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to picture frame (highlighted by a red box)? Choose from door (highlighted by a blue box) and chest of drawers (highlighted by a green box).\n(A) door\n(B) chest of drawers" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898988_823950389838791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, radiator (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) radiator\n(B) pillow" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260938_5004198706750_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chest of drawers (highlighted by a red box) or vase (highlighted by a blue box)?\n(A) chest of drawers\n(B) vase" }, { "from": "gpt", "value": "(B) vase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261689_409151806333_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, furniture (highlighted by a red box) or table (highlighted by a blue box)?\n(A) furniture\n(B) table" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897822_132766288529207_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from book cover (highlighted by a red box), pillow (highlighted by a blue box) or swivel chair (highlighted by a green box)?\n(A) pillow\n(B) swivel chair" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334935_663066891625291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444789_50595804992000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899643_231925991458625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, bed (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) bed\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429822_744672691806083_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331346_192306504539666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to table (highlighted by a red box)? Choose from window (highlighted by a blue box) and window (highlighted by a green box).\n(A) window\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895305_90799341319750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, furniture (highlighted by a red box) or blanket (highlighted by a blue box)?\n(A) furniture\n(B) blanket" }, { "from": "gpt", "value": "(B) blanket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458330_102973726846625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, cabinetry (highlighted by a red box) or waste container (highlighted by a blue box)?\n(A) cabinetry\n(B) waste container" }, { "from": "gpt", "value": "(B) waste container" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261569_76307326254833_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from file cabinet (highlighted by a red box)? Choose among these: curtain (highlighted by a blue box) or furniture (highlighted by a green box).\n(A) curtain\n(B) furniture" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669913_12744798874333_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from shower (highlighted by a red box)? light switch (highlighted by a blue box) or toilet (highlighted by a green box)?\n(A) light switch\n(B) toilet" }, { "from": "gpt", "value": "(B) toilet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898959_821181002509458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, cabinetry (highlighted by a red box) or refrigerator (highlighted by a blue box)?\n(A) cabinetry\n(B) refrigerator" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334205_103858177662791_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261681_3622755628750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, pillow (highlighted by a red box) or plain (highlighted by a blue box)?\n(A) pillow\n(B) plain" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204381_18123926897000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, fireplace (highlighted by a red box) or bean bag chair (highlighted by a blue box)?\n(A) fireplace\n(B) bean bag chair" }, { "from": "gpt", "value": "(A) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358230_10072571554708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to pillow (highlighted by a red box)? Select from pillow (highlighted by a blue box) and nightstand (highlighted by a green box).\n(A) pillow\n(B) nightstand" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670109_41025819638416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, window (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) window\n(B) picture frame" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796684_30784949544666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to door (highlighted by a red box)? Select from doormat (highlighted by a blue box) and footwear (highlighted by a green box).\n(A) doormat\n(B) footwear" }, { "from": "gpt", "value": "(A) doormat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333873_76295375981625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, houseplant (highlighted by a red box) or bulletin board (highlighted by a blue box)?\n(A) houseplant\n(B) bulletin board" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649714_47872643260916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from bottle (highlighted by a red box)? bottle (highlighted by a blue box) or basin (highlighted by a green box)?\n(A) bottle\n(B) basin" }, { "from": "gpt", "value": "(B) basin" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898195_145232928173625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, window (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) window\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445864_70664294496375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, cabinetry (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) cabinetry\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895491_450904069607208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, desk (highlighted by a red box) or book (highlighted by a blue box)?\n(A) desk\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261164_789904165458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, fireplace (highlighted by a red box) or fireplace (highlighted by a blue box)?\n(A) fireplace\n(B) fireplace" }, { "from": "gpt", "value": "(B) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649798_46154504144083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, tv show (highlighted by a red box) or brickwork (highlighted by a blue box)?\n(A) tv show\n(B) brickwork" }, { "from": "gpt", "value": "(A) tv show" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458706_136818462371458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, sink (highlighted by a red box) or window (highlighted by a blue box)?\n(A) sink\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429884_367786125882041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, dresser (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) dresser\n(B) curtain" }, { "from": "gpt", "value": "(A) dresser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204296_14325602284375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, table (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) table\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261297_16389632615333_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, curtain (highlighted by a red box) or shutter (highlighted by a blue box)?\n(A) curtain\n(B) shutter" }, { "from": "gpt", "value": "(B) shutter" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897490_471206825511541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the microwave oven (highlighted by a red box)? Choose among these: cabinetry (highlighted by a blue box) or appliance (highlighted by a green box).\n(A) cabinetry\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261533_74192223647375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, lamp (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) lamp\n(B) toy" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896484_23840704872208_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from pillow (highlighted by a red box)? picture frame (highlighted by a blue box) or window screen (highlighted by a green box)?\n(A) picture frame\n(B) window screen" }, { "from": "gpt", "value": "(B) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649382_10572263510666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from chest of drawers (highlighted by a red box)? paperback book (highlighted by a blue box) or book (highlighted by a green box)?\n(A) paperback book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260938_4980191548791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the studio couch (highlighted by a red box)? Choose among these: book (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) book\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895825_1220037273779791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334733_535827427731458_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to television (highlighted by a red box)? Select from plain (highlighted by a blue box) and appliance (highlighted by a green box).\n(A) plain\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334039_278743009570375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, pillow (highlighted by a red box) or table (highlighted by a blue box)?\n(A) pillow\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895994_136283814381291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to studio couch (highlighted by a red box)? table (highlighted by a blue box) or chair (highlighted by a green box).\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649384_11067210661791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from picture frame (highlighted by a red box), screen door (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) screen door\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458307_101732278942916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, storage box (highlighted by a red box) or concrete (highlighted by a blue box)?\n(A) storage box\n(B) concrete" }, { "from": "gpt", "value": "(A) storage box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895920_112111910305833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, ball (highlighted by a red box) or treadmill (highlighted by a blue box)?\n(A) ball\n(B) treadmill" }, { "from": "gpt", "value": "(B) treadmill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430280_186403172664125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhere is refrigerator (annotated by the red box) located in relation to toy in the image?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669917_14116259118625_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, swivel chair (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) swivel chair\n(B) furniture" }, { "from": "gpt", "value": "(A) swivel chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458637_128133484040750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, screen door (highlighted by a red box) or basin (highlighted by a blue box)?\n(A) screen door\n(B) basin" }, { "from": "gpt", "value": "(B) basin" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332764_43904135160875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, toy (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458772_142307241198333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, toy (highlighted by a red box) or desk (highlighted by a blue box)?\n(A) toy\n(B) desk" }, { "from": "gpt", "value": "(B) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458772_142361236452750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, window (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) window\n(B) window sill" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261169_1291160027833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chair (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) chair\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445206_10697528295500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is table (annotated by the red box) located in relation to door in the image? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333288_25267133303833_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332585_360677938880000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, houseplant (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) houseplant\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332748_42530414446375_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446576_205913539075583_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, book (highlighted by a red box) or cardboard box (highlighted by a blue box)?\n(A) book\n(B) cardboard box" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895920_112101914443541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to furniture (highlighted by a red box)? Choose from balloon (highlighted by a blue box) and blind (highlighted by a green box).\n(A) balloon\n(B) blind" }, { "from": "gpt", "value": "(B) blind" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204304_15068170110458_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, table (highlighted by a red box) or blind (highlighted by a blue box)?\n(A) table\n(B) blind" }, { "from": "gpt", "value": "(B) blind" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896199_142377140771083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to lamp (highlighted by a red box), picture frame (highlighted by a blue box) or curtain (highlighted by a green box)?\n(A) picture frame\n(B) curtain" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334761_421901734699583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the screen door (highlighted by a red box)? pillow (highlighted by a blue box) or door (highlighted by a green box).\n(A) pillow\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331508_155185920189083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, cereal (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) cereal\n(B) toy" }, { "from": "gpt", "value": "(A) cereal" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018328_115969898114958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, curtain (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) curtain\n(B) shelf" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898254_696666041075416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of shelf (annotated by the red box) in relation to chair? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898988_823939694220041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897419_103687889100791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, bath (highlighted by a red box) or mouthwash (highlighted by a blue box)?\n(A) bath\n(B) mouthwash" }, { "from": "gpt", "value": "(A) bath" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898254_696662042718666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from chair (highlighted by a red box)? glass door (highlighted by a blue box) or computer monitor (highlighted by a green box)?\n(A) glass door\n(B) computer monitor" }, { "from": "gpt", "value": "(B) computer monitor" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662874_14501270362833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of window (annotated by the red box) in reference to bed?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828478_100796748009166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of dot (annotated by the red box) in reference to light? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897467_471537821318583_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to kitchen appliance (highlighted by a red box)? door (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) door\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331893_623301536965625_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of door (annotated by the red box) in reference to corridor?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445677_61052017230250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895305_90811336487041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, chair (highlighted by a red box) or platter (highlighted by a blue box)?\n(A) chair\n(B) platter" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333055_60254988201750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, desk (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) desk\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896527_34778921821707_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, basket (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) basket\n(B) basket" }, { "from": "gpt", "value": "(B) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895936_107847518622833_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the chair (highlighted by a red box)? pillow (highlighted by a blue box) or table (highlighted by a green box).\n(A) pillow\n(B) table" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895860_489205267901791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is bed (annotated by the red box) located relative to pillow?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334273_157139270888750_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from cabinetry (highlighted by a red box), speaker (highlighted by a blue box) or blanket (highlighted by a green box)?\n(A) speaker\n(B) blanket" }, { "from": "gpt", "value": "(B) blanket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739463_51564396741916_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to houseplant (highlighted by a red box), mattress (highlighted by a blue box) or curtain (highlighted by a green box)?\n(A) mattress\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334883_622623697577416_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to wall clock (highlighted by a red box), glass door (highlighted by a blue box) or toy (highlighted by a green box)?\n(A) glass door\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739344_46020724974125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, computer monitor (highlighted by a red box) or clothing (highlighted by a blue box)?\n(A) computer monitor\n(B) clothing" }, { "from": "gpt", "value": "(A) computer monitor" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446140_141044570381166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to paperback book (highlighted by a red box)? Select from book (highlighted by a blue box) and book (highlighted by a green box).\n(A) book\n(B) book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899232_880570132630416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, toy (highlighted by a red box) or laundry (highlighted by a blue box)?\n(A) toy\n(B) laundry" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898577_183655695185916_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to christmas tree (highlighted by a red box)? studio couch (highlighted by a blue box) or screen door (highlighted by a green box).\n(A) studio couch\n(B) screen door" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669998_31356285338583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, sink (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) sink\n(B) toilet paper" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261277_14326257847375_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to window (highlighted by a red box), tile (highlighted by a blue box) or picnic basket (highlighted by a green box)?\n(A) tile\n(B) picnic basket" }, { "from": "gpt", "value": "(B) picnic basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331347_192526515143416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, cabinetry (highlighted by a red box) or beer bottle (highlighted by a blue box)?\n(A) cabinetry\n(B) beer bottle" }, { "from": "gpt", "value": "(B) beer bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47431041_141756053547250_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from swivel chair (highlighted by a red box)? Select from desk (highlighted by a blue box) and appliance (highlighted by a green box).\n(A) desk\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018869_653388080717791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from table (highlighted by a red box)? Choose from chair (highlighted by a blue box) and magazine (highlighted by a green box).\n(A) chair\n(B) magazine" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429728_19309335054291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of cabinetry (annotated by the red box) and door in the image provided, where is cabinetry (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663322_77555670935000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, oven (highlighted by a red box) or orange (highlighted by a blue box)?\n(A) oven\n(B) orange" }, { "from": "gpt", "value": "(A) oven" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445680_62102359665375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to chair (highlighted by a red box)? pillow (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) pillow\n(B) picture frame" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444751_79771863433791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to refrigerator (highlighted by a red box)? Select from cardboard box (highlighted by a blue box) and stainless steel (highlighted by a green box).\n(A) cardboard box\n(B) stainless steel" }, { "from": "gpt", "value": "(A) cardboard box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796226_2558921678500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, table lamp (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) table lamp\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331934_163599789129291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from counter (highlighted by a red box)? Choose among these: screen door (highlighted by a blue box) or kitchen appliance (highlighted by a green box).\n(A) screen door\n(B) kitchen appliance" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739611_200270537988875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, door (highlighted by a red box) or shower door (highlighted by a blue box)?\n(A) door\n(B) shower door" }, { "from": "gpt", "value": "(B) shower door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115624_3671095448833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, electric outlet (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) electric outlet\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333139_40054977980958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from furniture (highlighted by a red box)? Choose among these: curtain (highlighted by a blue box) or window (highlighted by a green box).\n(A) curtain\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898242_696000803546166_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the helmet (highlighted by a red box)? Choose among these: furniture (highlighted by a blue box) or blanket (highlighted by a green box).\n(A) furniture\n(B) blanket" }, { "from": "gpt", "value": "(B) blanket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458562_128140218332750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, countertop (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) countertop\n(B) bottle" }, { "from": "gpt", "value": "(A) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204392_22964091479666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from curtain (highlighted by a red box)? television (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) television\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331936_164598116429583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, furniture (highlighted by a red box) or material (highlighted by a blue box)?\n(A) furniture\n(B) material" }, { "from": "gpt", "value": "(B) material" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430314_264821054175000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from chair (highlighted by a red box)? chair (highlighted by a blue box) or floral arrangement (highlighted by a green box)?\n(A) chair\n(B) floral arrangement" }, { "from": "gpt", "value": "(B) floral arrangement" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334920_1091107196505833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, toilet (highlighted by a red box) or bathtub (highlighted by a blue box)?\n(A) toilet\n(B) bathtub" }, { "from": "gpt", "value": "(B) bathtub" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334912_1089940470549583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, home appliance (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) home appliance\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897924_348981830348666_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from toaster (highlighted by a red box)? Select from microwave oven (highlighted by a blue box) and bottle (highlighted by a green box).\n(A) microwave oven\n(B) bottle" }, { "from": "gpt", "value": "(A) microwave oven" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358162_60946735303083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828369_92385019858583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the mat (highlighted by a red box)? table (highlighted by a blue box) or chair (highlighted by a green box).\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115136_85965928507791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, porcelain (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) porcelain\n(B) toilet paper" }, { "from": "gpt", "value": "(A) porcelain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331277_13226440835041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from shelf (highlighted by a red box)? bookcase (highlighted by a blue box) or paperback book (highlighted by a green box)?\n(A) bookcase\n(B) paperback book" }, { "from": "gpt", "value": "(B) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333188_47305541742750_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, vase (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) vase\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897898_345234796126500_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, computer monitor (highlighted by a red box) or computer monitor (highlighted by a blue box)?\n(A) computer monitor\n(B) computer monitor" }, { "from": "gpt", "value": "(B) computer monitor" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446485_355818359050708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, bed (highlighted by a red box) or nightstand (highlighted by a blue box)?\n(A) bed\n(B) nightstand" }, { "from": "gpt", "value": "(B) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018845_649718011242125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, file cabinet (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) file cabinet\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47431041_141776162055625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to sink (highlighted by a red box)? faucet (highlighted by a blue box) or appliance (highlighted by a green box).\n(A) faucet\n(B) appliance" }, { "from": "gpt", "value": "(A) faucet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896103_145362908361208_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to picture frame (highlighted by a red box)? picture frame (highlighted by a blue box) or wood burning stove (highlighted by a green box).\n(A) picture frame\n(B) wood burning stove" }, { "from": "gpt", "value": "(B) wood burning stove" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458524_125820160238500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, studio couch (highlighted by a red box) or door (highlighted by a blue box)?\n(A) studio couch\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898786_67384005789916_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895994_136295809390540_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to chair (highlighted by a red box), table (highlighted by a blue box) or cabinetry (highlighted by a green box)?\n(A) table\n(B) cabinetry" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333778_48307626309791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the book (highlighted by a red box)? book (highlighted by a blue box) or book (highlighted by a green box).\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430452_2056546359083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, footwear (highlighted by a red box) or footwear (highlighted by a blue box)?\n(A) footwear\n(B) footwear" }, { "from": "gpt", "value": "(A) footwear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446574_86396063651208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018115_368424324584291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from wood (highlighted by a red box)? Choose from trash bin/can (highlighted by a blue box) and cardboard box (highlighted by a green box).\n(A) trash bin/can\n(B) cardboard box" }, { "from": "gpt", "value": "(B) cardboard box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429646_8169190665750_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895829_1221705822750750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, door (highlighted by a red box) or glass door (highlighted by a blue box)?\n(A) door\n(B) glass door" }, { "from": "gpt", "value": "(B) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897928_348902429612375_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the bottle (highlighted by a red box)? Choose among these: bottle (highlighted by a blue box) or countertop (highlighted by a green box).\n(A) bottle\n(B) countertop" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899913_1028265548457625_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, toiletry (highlighted by a red box) or bath (highlighted by a blue box)?\n(A) toiletry\n(B) bath" }, { "from": "gpt", "value": "(B) bath" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018339_117078908396458_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the cabinetry (highlighted by a red box)? Choose among these: book (highlighted by a blue box) or toy (highlighted by a green box).\n(A) book\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895994_136293810222708_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to table lamp (highlighted by a red box), book (highlighted by a blue box) or book (highlighted by a green box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445680_62002368164375_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears farthest from the camera in this image?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445999_134117757425791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from appliance (highlighted by a red box)? paper towel (highlighted by a blue box) or window (highlighted by a green box)?\n(A) paper towel\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828552_101592710282125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, bar stool (highlighted by a red box) or book (highlighted by a blue box)?\n(A) bar stool\n(B) book" }, { "from": "gpt", "value": "(A) bar stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332795_47600102614375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, door (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) door\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649393_11187710689500_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to book cover (highlighted by a red box)? book (highlighted by a blue box) or paperback book (highlighted by a green box).\n(A) book\n(B) paperback book" }, { "from": "gpt", "value": "(B) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333561_200737773938666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from mirror (highlighted by a red box), coffee cup (highlighted by a blue box) or sink (highlighted by a green box)?\n(A) coffee cup\n(B) sink" }, { "from": "gpt", "value": "(A) coffee cup" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796745_28732072737333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from picture frame (highlighted by a red box)? curtain (highlighted by a blue box) or desk (highlighted by a green box)?\n(A) curtain\n(B) desk" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334906_1086562123945375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, couch (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) couch\n(B) pillow" }, { "from": "gpt", "value": "(A) couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458447_117534594077375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the book (highlighted by a red box)? Choose among these: bean bag chair (highlighted by a blue box) or door (highlighted by a green box).\n(A) bean bag chair\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649603_36031595490708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to shelf (highlighted by a red box)? book (highlighted by a blue box) or book (highlighted by a green box).\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897755_117638113329416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018203_467245006120958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, side cabinet (highlighted by a red box) or cupboard (highlighted by a blue box)?\n(A) side cabinet\n(B) cupboard" }, { "from": "gpt", "value": "(B) cupboard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333277_24472506711250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, houseplant (highlighted by a red box) or book (highlighted by a blue box)?\n(A) houseplant\n(B) book" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828311_76502537297916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of furniture (annotated by the red box) in reference to clothing? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331617_18230973361000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to speaker (highlighted by a red box)? Select from flower (highlighted by a blue box) and chair (highlighted by a green box).\n(A) flower\n(B) chair" }, { "from": "gpt", "value": "(A) flower" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828369_92306918834083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chair (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) chair\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429720_18074650225625_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from clear (highlighted by a red box)? appliance (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) appliance\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331507_155082512061500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, furniture (highlighted by a red box) or balloon (highlighted by a blue box)?\n(A) furniture\n(B) balloon" }, { "from": "gpt", "value": "(B) balloon" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828243_81908990217000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chest of drawers (highlighted by a red box) or medicine cabinet (highlighted by a blue box)?\n(A) chest of drawers\n(B) medicine cabinet" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796520_4085796205833_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from toiletry (highlighted by a red box)? bathtub (highlighted by a blue box) or cleaning product (highlighted by a green box)?\n(A) bathtub\n(B) cleaning product" }, { "from": "gpt", "value": "(A) bathtub" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447294_408900199887250_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to chair (highlighted by a red box)? shelf (highlighted by a blue box) or table (highlighted by a green box).\n(A) shelf\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429799_737721022869541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from concrete (highlighted by a red box)? Choose from table (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) table\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895245_75690990957833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the window sill (highlighted by a red box)? Choose among these: paperback book (highlighted by a blue box) or houseplant (highlighted by a green box).\n(A) paperback book\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334459_100760191445958_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796579_16772162816041_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to door (highlighted by a red box), door (highlighted by a blue box) or fireplace (highlighted by a green box)?\n(A) door\n(B) fireplace" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895622_470880745943416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from toiletry (highlighted by a red box)? toiletry (highlighted by a blue box) or shower (highlighted by a green box)?\n(A) toiletry\n(B) shower" }, { "from": "gpt", "value": "(A) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333838_54148564403291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, chair (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) chair\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898555_181928075787791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from storage box (highlighted by a red box)? book (highlighted by a blue box) or book (highlighted by a green box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897925_348968235940625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, lamp (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) lamp\n(B) cabinetry" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897455_469641463583458_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, mirror (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) mirror\n(B) picture frame" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458260_74337047749125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from clothing (highlighted by a red box)? cardboard box (highlighted by a blue box) or storage box (highlighted by a green box)?\n(A) cardboard box\n(B) storage box" }, { "from": "gpt", "value": "(A) cardboard box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115650_4727444920583_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to picture frame (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and screen door (highlighted by a green box).\n(A) picture frame\n(B) screen door" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446488_356795857084791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, cleaning product (highlighted by a red box) or product (highlighted by a blue box)?\n(A) cleaning product\n(B) product" }, { "from": "gpt", "value": "(A) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261541_74231324126625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, book (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) book\n(B) pillow" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663009_32386510296791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chair (highlighted by a red box) or blind (highlighted by a blue box)?\n(A) chair\n(B) blind" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899352_715969282859708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, luggage (highlighted by a red box) or concrete (highlighted by a blue box)?\n(A) luggage\n(B) concrete" }, { "from": "gpt", "value": "(A) luggage" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739344_46014527537750_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, studio couch (highlighted by a red box) or box (highlighted by a blue box)?\n(A) studio couch\n(B) box" }, { "from": "gpt", "value": "(B) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669856_12402450658041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, window screen (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) window screen\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739612_200181839722916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to toilet paper (highlighted by a red box), counter top (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) counter top\n(B) picture frame" }, { "from": "gpt", "value": "(A) counter top" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332026_202819494013166_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from mug (highlighted by a red box)? bottle (highlighted by a blue box) or gas stove (highlighted by a green box)?\n(A) bottle\n(B) gas stove" }, { "from": "gpt", "value": "(B) gas stove" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649648_40271621590125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the toothbrush (highlighted by a red box)? Choose among these: toilet bowl (highlighted by a blue box) or toiletry (highlighted by a green box).\n(A) toilet bowl\n(B) toiletry" }, { "from": "gpt", "value": "(B) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896412_16632219872208_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669978_28824288078500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, bed (highlighted by a red box) or desk (highlighted by a blue box)?\n(A) bed\n(B) desk" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669880_11240299068291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, plant (highlighted by a red box) or window screen (highlighted by a blue box)?\n(A) plant\n(B) window screen" }, { "from": "gpt", "value": "(B) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898983_823782192020291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from bed (highlighted by a red box)? curtain (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) curtain\n(B) pillow" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649384_11073208176541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, table lamp (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) table lamp\n(B) screen door" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430950_96343261291666_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from bowl (highlighted by a red box), appliance (highlighted by a blue box) or shelf (highlighted by a green box)?\n(A) appliance\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898021_220917127624208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, furniture (highlighted by a red box) or speaker (highlighted by a blue box)?\n(A) furniture\n(B) speaker" }, { "from": "gpt", "value": "(B) speaker" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899657_234551870914750_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from door (highlighted by a red box)? Select from window (highlighted by a blue box) and door (highlighted by a green box).\n(A) window\n(B) door" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430862_74301899327625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from plain (highlighted by a red box)? Choose among these: dresser (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) dresser\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896209_2198177252872_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, picture frame (highlighted by a red box) or armchair (highlighted by a blue box)?\n(A) picture frame\n(B) armchair" }, { "from": "gpt", "value": "(B) armchair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445955_129968354433666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to pillow (highlighted by a red box), table (highlighted by a blue box) or studio couch (highlighted by a green box)?\n(A) table\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895272_79362101119875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, studio couch (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) studio couch\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670116_41805687899916_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from handbag (highlighted by a red box)? Select from computer monitor (highlighted by a blue box) and computer keyboard (highlighted by a green box).\n(A) computer monitor\n(B) computer keyboard" }, { "from": "gpt", "value": "(A) computer monitor" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430982_101732334801291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of shoe (annotated by the red box) in relation to poster? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446462_354258423391208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, picture frame (highlighted by a red box) or clothing (highlighted by a blue box)?\n(A) picture frame\n(B) clothing" }, { "from": "gpt", "value": "(B) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458700_135308781511457_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, studio couch (highlighted by a red box) or blanket (highlighted by a blue box)?\n(A) studio couch\n(B) blanket" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332810_48262831484000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, refrigerator (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) refrigerator\n(B) toy" }, { "from": "gpt", "value": "(A) refrigerator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115504_12294316548791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, curtain (highlighted by a red box) or television (highlighted by a blue box)?\n(A) curtain\n(B) television" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898651_572745826985750_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333776_48167633038541_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears farthest from the camera in this image?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898392_369352018137500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, chest of drawers (highlighted by a red box) or bed (highlighted by a blue box)?\n(A) chest of drawers\n(B) bed" }, { "from": "gpt", "value": "(B) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828243_81856995084416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, animal (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) animal\n(B) pillow" }, { "from": "gpt", "value": "(A) animal" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333876_77254361241666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to wine bottle (highlighted by a red box)? Select from cupboard (highlighted by a blue box) and electric outlet (highlighted by a green box).\n(A) cupboard\n(B) electric outlet" }, { "from": "gpt", "value": "(A) cupboard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445954_129865446574791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of door (annotated by the red box) in relation to door? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333493_62627499079208_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the tea pot (highlighted by a red box)? bottle (highlighted by a blue box) or bottle (highlighted by a green box).\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333583_207396130117500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, chair (highlighted by a red box) or coffee table (highlighted by a blue box)?\n(A) chair\n(B) coffee table" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358661_1098999886247_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from lamp (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and electric outlet (highlighted by a green box).\n(A) picture frame\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445125_5232018010541_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663053_38559388615958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from faucet (highlighted by a red box)? cabinetry (highlighted by a blue box) or table (highlighted by a green box)?\n(A) cabinetry\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334139_142711927143750_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from stationery (highlighted by a red box)? Choose from laptop (highlighted by a blue box) and notepad (highlighted by a green box).\n(A) laptop\n(B) notepad" }, { "from": "gpt", "value": "(A) laptop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898405_369786978521708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from toilet paper (highlighted by a red box), screen door (highlighted by a blue box) or mirror (highlighted by a green box)?\n(A) screen door\n(B) mirror" }, { "from": "gpt", "value": "(B) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896215_4290943140915_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, door (highlighted by a red box) or door (highlighted by a blue box)?\n(A) door\n(B) door" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261323_23373187416000_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to radiator (highlighted by a red box)? Choose from chair (highlighted by a blue box) and chair (highlighted by a green box).\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444754_80985156010833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, lamp (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) lamp\n(B) furniture" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261248_15196799569125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, desk (highlighted by a red box) or notebook (highlighted by a blue box)?\n(A) desk\n(B) notebook" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828282_84387693142000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, window (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) window\n(B) appliance" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444904_106228166662833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the table (highlighted by a red box)? Choose among these: electric outlet (highlighted by a blue box) or television (highlighted by a green box).\n(A) electric outlet\n(B) television" }, { "from": "gpt", "value": "(B) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331496_153633408950958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, shelf (highlighted by a red box) or cleaning product (highlighted by a blue box)?\n(A) shelf\n(B) cleaning product" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334207_103236802348166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of animal (annotated by the red box) in relation to pillow?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446450_354761034568916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, picture frame (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) picture frame\n(B) curtain" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663257_77805566303375_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896174_140818425895583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from throw pillow (highlighted by a red box)? throw pillow (highlighted by a blue box) or round table (highlighted by a green box)?\n(A) throw pillow\n(B) round table" }, { "from": "gpt", "value": "(B) round table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796477_4158918335708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to toy (highlighted by a red box)? clothing (highlighted by a blue box) or toy (highlighted by a green box).\n(A) clothing\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895593_1161514174330583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to hand towel (highlighted by a red box)? Select from cabinetry (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) cabinetry\n(B) cabinetry" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649634_39384242085666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, cabinetry (highlighted by a red box) or medicine cabinet (highlighted by a blue box)?\n(A) cabinetry\n(B) medicine cabinet" }, { "from": "gpt", "value": "(B) medicine cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018609_632850420414958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from car (highlighted by a red box)? lamp (highlighted by a blue box) or swivel chair (highlighted by a green box)?\n(A) lamp\n(B) swivel chair" }, { "from": "gpt", "value": "(B) swivel chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333473_58539338072958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to table (highlighted by a red box)? Select from furniture (highlighted by a blue box) and throw pillow (highlighted by a green box).\n(A) furniture\n(B) throw pillow" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204322_16022056700250_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from houseplant (highlighted by a red box)? Select from curtain (highlighted by a blue box) and electric outlet (highlighted by a green box).\n(A) curtain\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828476_100679046783875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, round table (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) round table\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446493_356416645526958_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261323_23423183381916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to door (highlighted by a red box), chair (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334040_278938913216625_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, fridge (highlighted by a red box) or gas stove (highlighted by a blue box)?\n(A) fridge\n(B) gas stove" }, { "from": "gpt", "value": "(B) gas stove" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333233_32432261926833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, toy (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018644_636298741587375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, clothing (highlighted by a red box) or toilet (highlighted by a blue box)?\n(A) clothing\n(B) toilet" }, { "from": "gpt", "value": "(A) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331491_153175618846541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, furniture (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) furniture\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331617_18218978241750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, pillow (highlighted by a red box) or coffee table (highlighted by a blue box)?\n(A) pillow\n(B) coffee table" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332952_21909393835750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chair (highlighted by a red box) or footwear (highlighted by a blue box)?\n(A) chair\n(B) footwear" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796326_16278076190625_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to book (highlighted by a red box)? Choose from coffee cup (highlighted by a blue box) and coffee cup (highlighted by a green box).\n(A) coffee cup\n(B) coffee cup" }, { "from": "gpt", "value": "(A) coffee cup" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898722_583034574102375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, table lamp (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) table lamp\n(B) electric outlet" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899935_863168285754041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, table (highlighted by a red box) or postcard (highlighted by a blue box)?\n(A) table\n(B) postcard" }, { "from": "gpt", "value": "(B) postcard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332113_684301292295458_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, sink (highlighted by a red box) or medicine cabinet (highlighted by a blue box)?\n(A) sink\n(B) medicine cabinet" }, { "from": "gpt", "value": "(B) medicine cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896209_2285374113208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, microwave oven (highlighted by a red box) or laundry (highlighted by a blue box)?\n(A) microwave oven\n(B) laundry" }, { "from": "gpt", "value": "(A) microwave oven" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334669_391511912597541_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896512_33376272515333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from table (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and fireplace (highlighted by a green box).\n(A) picture frame\n(B) fireplace" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828334_79021136053666_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, table lamp (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) table lamp\n(B) picture frame" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662791_12824980100625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, pillow (highlighted by a red box) or table (highlighted by a blue box)?\n(A) pillow\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332469_886455274536416_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from gas stove (highlighted by a red box)? Choose among these: home appliance (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) home appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739646_2220147759166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from brush (highlighted by a red box)? Choose from bathtub (highlighted by a blue box) and mirror (highlighted by a green box).\n(A) bathtub\n(B) mirror" }, { "from": "gpt", "value": "(A) bathtub" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115217_94888738763791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to appliance (highlighted by a red box)? Choose from door (highlighted by a blue box) and window (highlighted by a green box).\n(A) door\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663377_92451705314083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of radiator (annotated by the red box) in reference to window? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796326_16237876169958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, clothing (highlighted by a red box) or clothing (highlighted by a blue box)?\n(A) clothing\n(B) clothing" }, { "from": "gpt", "value": "(A) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331423_544259123641083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, box (highlighted by a red box) or book (highlighted by a blue box)?\n(A) box\n(B) book" }, { "from": "gpt", "value": "(A) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334487_104546616758625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from bottle (highlighted by a red box)? Choose from houseplant (highlighted by a blue box) and television (highlighted by a green box).\n(A) houseplant\n(B) television" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669854_12625458284125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, glass door (highlighted by a red box) or fireplace (highlighted by a blue box)?\n(A) glass door\n(B) fireplace" }, { "from": "gpt", "value": "(B) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897675_148501498042083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, window (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) window\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828507_102551352673666_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from cabinetry (highlighted by a red box)? Select from chair (highlighted by a blue box) and round table (highlighted by a green box).\n(A) chair\n(B) round table" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445680_62122351296916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the magazine (highlighted by a red box)? Choose among these: table (highlighted by a blue box) or studio couch (highlighted by a green box).\n(A) table\n(B) studio couch" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429822_744668593480583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, studio couch (highlighted by a red box) or bed (highlighted by a blue box)?\n(A) studio couch\n(B) bed" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898621_758036307190291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, bathtub (highlighted by a red box) or copy (highlighted by a blue box)?\n(A) bathtub\n(B) copy" }, { "from": "gpt", "value": "(A) bathtub" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898501_160021787646375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, chest of drawers (highlighted by a red box) or toilet bowl (highlighted by a blue box)?\n(A) chest of drawers\n(B) toilet bowl" }, { "from": "gpt", "value": "(B) toilet bowl" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828507_102467254256166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, lamp (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) lamp\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669856_12440451599916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, window (highlighted by a red box) or swivel chair (highlighted by a blue box)?\n(A) window\n(B) swivel chair" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331800_227892275389291_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from swivel chair (highlighted by a red box), chair (highlighted by a blue box) or table lamp (highlighted by a green box)?\n(A) chair\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430978_101949129737750_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896176_141507832917208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, furniture (highlighted by a red box) or swivel chair (highlighted by a blue box)?\n(A) furniture\n(B) swivel chair" }, { "from": "gpt", "value": "(B) swivel chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669880_11280299844500_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from wine bottle (highlighted by a red box)? Choose among these: chair (highlighted by a blue box) or kitchen & dining room table (highlighted by a green box).\n(A) chair\n(B) kitchen & dining room table" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331699_9526231636791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from window (highlighted by a red box)? window (highlighted by a blue box) or bay window (highlighted by a green box)?\n(A) window\n(B) bay window" }, { "from": "gpt", "value": "(B) bay window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333806_51221948140791_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from toy (highlighted by a red box)? Select from toy (highlighted by a blue box) and book (highlighted by a green box).\n(A) toy\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898988_823890397748875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, bed (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) bed\n(B) picture frame" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115358_4203808899750_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to light fixture (highlighted by a red box)? window screen (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) window screen\n(B) cabinetry" }, { "from": "gpt", "value": "(A) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895249_75792082858375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to animal (highlighted by a red box)? Select from woman (highlighted by a blue box) and toy (highlighted by a green box).\n(A) woman\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334213_105730202824791_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from bottle (highlighted by a red box), bottle (highlighted by a blue box) or bottle (highlighted by a green box)?\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897892_345202509469541_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, door (highlighted by a red box) or cardboard box (highlighted by a blue box)?\n(A) door\n(B) cardboard box" }, { "from": "gpt", "value": "(B) cardboard box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334660_390838894737458_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430439_1070462014958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from shelf (highlighted by a red box), toy (highlighted by a blue box) or bottle (highlighted by a green box)?\n(A) toy\n(B) bottle" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444781_50246798713000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430983_101597422980583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, countertop (highlighted by a red box) or couch (highlighted by a blue box)?\n(A) countertop\n(B) couch" }, { "from": "gpt", "value": "(A) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332651_368984572550500_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670358_67328284483416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, candle (highlighted by a red box) or window (highlighted by a blue box)?\n(A) candle\n(B) window" }, { "from": "gpt", "value": "(A) candle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261228_13788720062000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chest of drawers (highlighted by a red box) or bulletin board (highlighted by a blue box)?\n(A) chest of drawers\n(B) bulletin board" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334459_100768188211666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, curtain (highlighted by a red box) or window (highlighted by a blue box)?\n(A) curtain\n(B) window" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331496_153653817378666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, washing machine (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) washing machine\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018339_117078908396458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, cabinetry (highlighted by a red box) or book (highlighted by a blue box)?\n(A) cabinetry\n(B) book" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899263_883253305430333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhere is window sill (annotated by the red box) located in relation to window blind in the image?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796446_603716617833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, mirror (highlighted by a red box) or nightstand (highlighted by a blue box)?\n(A) mirror\n(B) nightstand" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649459_13932026363750_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from furniture (highlighted by a red box)? Choose among these: picture frame (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331010_181958784340125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, fancy dress (highlighted by a red box) or laundry (highlighted by a blue box)?\n(A) fancy dress\n(B) laundry" }, { "from": "gpt", "value": "(A) fancy dress" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649615_36986571968500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, door (highlighted by a red box) or door (highlighted by a blue box)?\n(A) door\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896101_145179201278791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, door (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) door\n(B) radiator" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895279_79237901576500_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to cabinetry (highlighted by a red box), kitchen appliance (highlighted by a blue box) or tea pot (highlighted by a green box)?\n(A) kitchen appliance\n(B) tea pot" }, { "from": "gpt", "value": "(A) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429947_140098421081000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, radiator (highlighted by a red box) or cabinet (highlighted by a blue box)?\n(A) radiator\n(B) cabinet" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796443_821409579041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, table lamp (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) table lamp\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669903_12288126400541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from electric outlet (highlighted by a red box)? curtain (highlighted by a blue box) or concrete (highlighted by a green box)?\n(A) curtain\n(B) concrete" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670122_41718890663375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of door (annotated by the red box) in reference to cabinetry? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358418_41191920253583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, picture frame (highlighted by a red box) or light (highlighted by a blue box)?\n(A) picture frame\n(B) light" }, { "from": "gpt", "value": "(B) light" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115358_4171805542291_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from picture frame (highlighted by a red box)? Choose from window (highlighted by a blue box) and houseplant (highlighted by a green box).\n(A) window\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895585_1159997343315875_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the animal (highlighted by a red box)? door (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) door\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333288_25331823689875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, houseplant (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) houseplant\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896188_141869418629500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, art (highlighted by a red box) or droplight (highlighted by a blue box)?\n(A) art\n(B) droplight" }, { "from": "gpt", "value": "(B) droplight" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333827_53262748270958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from soap (highlighted by a red box)? Choose from ledge (highlighted by a blue box) and towel bar (highlighted by a green box).\n(A) ledge\n(B) towel bar" }, { "from": "gpt", "value": "(B) towel bar" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48017950_455702899660833_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the lamp (highlighted by a red box)? table (highlighted by a blue box) or lamp (highlighted by a green box).\n(A) table\n(B) lamp" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899041_645670407345333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018901_655370887484708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, lamp (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) lamp\n(B) toy" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261228_13676716705375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to appliance (highlighted by a red box)? bottle (highlighted by a blue box) or chair (highlighted by a green box).\n(A) bottle\n(B) chair" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331525_191705699234291_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to bidet (highlighted by a red box)? washing machine (highlighted by a blue box) or chair (highlighted by a green box).\n(A) washing machine\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444712_73967719487875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, power plugs and sockets (highlighted by a red box) or concrete (highlighted by a blue box)?\n(A) power plugs and sockets\n(B) concrete" }, { "from": "gpt", "value": "(B) concrete" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895448_129501087371291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, washing machine (highlighted by a red box) or doormat (highlighted by a blue box)?\n(A) washing machine\n(B) doormat" }, { "from": "gpt", "value": "(A) washing machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48017888_79827811877666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, window sill (highlighted by a red box) or plant (highlighted by a blue box)?\n(A) window sill\n(B) plant" }, { "from": "gpt", "value": "(A) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444789_50563401716250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, home appliance (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) home appliance\n(B) appliance" }, { "from": "gpt", "value": "(A) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261653_1292035374458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, picture frame (highlighted by a red box) or door (highlighted by a blue box)?\n(A) picture frame\n(B) door" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331707_11143923657750_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from sink (highlighted by a red box), faucet (highlighted by a blue box) or bottle (highlighted by a green box)?\n(A) faucet\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649688_36004459743666_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the cabinetry (highlighted by a red box)? clothing (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) clothing\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331915_629315000359500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, cabinetry (highlighted by a red box) or computer monitor (highlighted by a blue box)?\n(A) cabinetry\n(B) computer monitor" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896209_2214170576000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, appliance (highlighted by a red box) or armchair (highlighted by a blue box)?\n(A) appliance\n(B) armchair" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669937_14951597536708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, bath mat (highlighted by a red box) or footwear (highlighted by a blue box)?\n(A) bath mat\n(B) footwear" }, { "from": "gpt", "value": "(B) footwear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018404_393286490536500_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from couch (highlighted by a red box), mirror (highlighted by a blue box) or robe (highlighted by a green box)?\n(A) mirror\n(B) robe" }, { "from": "gpt", "value": "(B) robe" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899318_887509798698291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, door (highlighted by a red box) or footwear (highlighted by a blue box)?\n(A) door\n(B) footwear" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458729_138449715989791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from cleaning product (highlighted by a red box)? Choose among these: cleaning product (highlighted by a blue box) or bathtub (highlighted by a green box).\n(A) cleaning product\n(B) bathtub" }, { "from": "gpt", "value": "(B) bathtub" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663250_75112084894375_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to couch (highlighted by a red box)? Choose from coffee table (highlighted by a blue box) and paperback book (highlighted by a green box).\n(A) coffee table\n(B) paperback book" }, { "from": "gpt", "value": "(A) coffee table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430269_185653609289250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, bookcase (highlighted by a red box) or book (highlighted by a blue box)?\n(A) bookcase\n(B) book" }, { "from": "gpt", "value": "(A) bookcase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331103_135852883337290_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, table (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445841_69216254715624_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from pillow (highlighted by a red box)? Select from table lamp (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) table lamp\n(B) pillow" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828231_69937425671332_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, woman (highlighted by a red box) or glass door (highlighted by a blue box)?\n(A) woman\n(B) glass door" }, { "from": "gpt", "value": "(A) woman" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204736_24091343979083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, cabinetry (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) cabinetry\n(B) appliance" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897467_471511815478250_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the studio couch (highlighted by a red box)? chair (highlighted by a blue box) or box (highlighted by a green box).\n(A) chair\n(B) box" }, { "from": "gpt", "value": "(B) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444751_79777860958166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, light switch (highlighted by a red box) or window (highlighted by a blue box)?\n(A) light switch\n(B) window" }, { "from": "gpt", "value": "(A) light switch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204296_14353590690291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, furniture (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) furniture\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429939_139226030050833_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from bookshelf (highlighted by a red box)? Choose among these: appliance (highlighted by a blue box) or counter top (highlighted by a green box).\n(A) appliance\n(B) counter top" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429855_12680752817250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, flowerpot (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) flowerpot\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895245_75692990139583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, bed (highlighted by a red box) or window (highlighted by a blue box)?\n(A) bed\n(B) window" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899936_863389277536666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115504_12300314177208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, window (highlighted by a red box) or paperback book (highlighted by a blue box)?\n(A) window\n(B) paperback book" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333803_51506849063291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, tableware (highlighted by a red box) or tableware (highlighted by a blue box)?\n(A) tableware\n(B) tableware" }, { "from": "gpt", "value": "(A) tableware" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331180_277485801391041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the swivel chair (highlighted by a red box)? Choose among these: chair (highlighted by a blue box) or screen door (highlighted by a green box).\n(A) chair\n(B) screen door" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260873_7493653762291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, animal (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) animal\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899002_640961816481416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, counter top (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) counter top\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446576_205907441595458_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from pillow (highlighted by a red box)? houseplant (highlighted by a blue box) or window (highlighted by a green box)?\n(A) houseplant\n(B) window" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898393_369434018476583_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to door (highlighted by a red box), screen door (highlighted by a blue box) or cabinetry (highlighted by a green box)?\n(A) screen door\n(B) cabinetry" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204453_23067583557708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from television (highlighted by a red box)? Select from lamp (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) lamp\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332044_207175379669791_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333283_25457422472000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, garage door (highlighted by a red box) or window frame (highlighted by a blue box)?\n(A) garage door\n(B) window frame" }, { "from": "gpt", "value": "(A) garage door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649774_43560199395041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the paper bag (highlighted by a red box)? Choose among these: lamp (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) lamp\n(B) picture frame" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115376_1808092184583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, window (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) window\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358121_62425090757500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from curtain (highlighted by a red box)? appliance (highlighted by a blue box) or countertop (highlighted by a green box)?\n(A) appliance\n(B) countertop" }, { "from": "gpt", "value": "(B) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898256_696456043837958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, furniture (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) furniture\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430931_92899369096583_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to counter top (highlighted by a red box), sweat pant (highlighted by a blue box) or bedding (highlighted by a green box)?\n(A) sweat pant\n(B) bedding" }, { "from": "gpt", "value": "(A) sweat pant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331346_192250510550250_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to cabinetry (highlighted by a red box)? Choose from lamp (highlighted by a blue box) and houseplant (highlighted by a green box).\n(A) lamp\n(B) houseplant" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331154_181656719084000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhere is light fixture (annotated by the red box) located in relation to bath in the image?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895863_107818171307375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, lamp (highlighted by a red box) or watering can (highlighted by a blue box)?\n(A) lamp\n(B) watering can" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261357_25852222349500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, baby carriage (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) baby carriage\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649393_11195707370958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, round table (highlighted by a red box) or tableware (highlighted by a blue box)?\n(A) round table\n(B) tableware" }, { "from": "gpt", "value": "(A) round table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430824_67633660447457_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chest of drawers (highlighted by a red box) or computer desk (highlighted by a blue box)?\n(A) chest of drawers\n(B) computer desk" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430220_180126000289708_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, amplifier (highlighted by a red box) or window (highlighted by a blue box)?\n(A) amplifier\n(B) window" }, { "from": "gpt", "value": "(A) amplifier" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331080_133676685445874_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, window blind (highlighted by a red box) or bay window (highlighted by a blue box)?\n(A) window blind\n(B) bay window" }, { "from": "gpt", "value": "(B) bay window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331490_153026612811750_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the houseplant (highlighted by a red box)? Choose among these: round table (highlighted by a blue box) or book (highlighted by a green box).\n(A) round table\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895191_38712433734791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, mirror (highlighted by a red box) or flower (highlighted by a blue box)?\n(A) mirror\n(B) flower" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334464_100925290972083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to appliance (highlighted by a red box)? Choose from shelf (highlighted by a blue box) and comic book (highlighted by a green box).\n(A) shelf\n(B) comic book" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896009_137242264592250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896234_6923267608416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the picture frame (highlighted by a red box)? drawer (highlighted by a blue box) or chair (highlighted by a green box).\n(A) drawer\n(B) chair" }, { "from": "gpt", "value": "(A) drawer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828282_84423694911041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, cabinetry (highlighted by a red box) or window (highlighted by a blue box)?\n(A) cabinetry\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828150_73454113392583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is stool (annotated by the red box) located in relation to stool in the image? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334853_615533439653916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, laundry basket (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) laundry basket\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430212_688683346369458_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, door (highlighted by a red box) or door (highlighted by a blue box)?\n(A) door\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018273_794980085051125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, refrigerator (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) refrigerator\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896083_144011898312291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, side (highlighted by a red box) or waste container (highlighted by a blue box)?\n(A) side\n(B) waste container" }, { "from": "gpt", "value": "(B) waste container" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331762_7366247751500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of table (annotated by the red box) in reference to furniture?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333803_51592847368916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, book (highlighted by a red box) or bedside lamp (highlighted by a blue box)?\n(A) book\n(B) bedside lamp" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018542_829040869937000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, bed (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) bed\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430934_94926535745875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, bowl (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) bowl\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261641_665797829750_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018609_632863115260375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of chair (annotated by the red box) in reference to chair? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458330_103042514888875_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to table (highlighted by a red box)? Choose from pillow (highlighted by a blue box) and studio couch (highlighted by a green box).\n(A) pillow\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739315_44735911731000_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from plant (highlighted by a red box)? Choose from window (highlighted by a blue box) and mirror (highlighted by a green box).\n(A) window\n(B) mirror" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332564_905960634379125_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the table (highlighted by a red box)? Choose among these: table lamp (highlighted by a blue box) or book (highlighted by a green box).\n(A) table lamp\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458561_128015220204541_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the door (highlighted by a red box)? cleaning product (highlighted by a blue box) or bottle (highlighted by a green box).\n(A) cleaning product\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897777_129026518590750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, door (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) door\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895231_73985596940000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, cabinetry (highlighted by a red box) or backdrop (highlighted by a blue box)?\n(A) cabinetry\n(B) backdrop" }, { "from": "gpt", "value": "(B) backdrop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331818_228828347416041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, mouthwash (highlighted by a red box) or mouthwash (highlighted by a blue box)?\n(A) mouthwash\n(B) mouthwash" }, { "from": "gpt", "value": "(A) mouthwash" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896216_4200547499208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, towel (highlighted by a red box) or towel (highlighted by a blue box)?\n(A) towel\n(B) towel" }, { "from": "gpt", "value": "(A) towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458675_9285697349375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from floral arrangement (highlighted by a red box), coffee table (highlighted by a blue box) or studio couch (highlighted by a green box)?\n(A) coffee table\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898037_222238825216708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, appliance (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) appliance\n(B) basket" }, { "from": "gpt", "value": "(B) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444692_72752773679916_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from wall clock (highlighted by a red box)? appliance (highlighted by a blue box) or countertop (highlighted by a green box)?\n(A) appliance\n(B) countertop" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445987_132247080831875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to nightstand (highlighted by a red box)? radiator (highlighted by a blue box) or bed (highlighted by a green box).\n(A) radiator\n(B) bed" }, { "from": "gpt", "value": "(B) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333827_53276759256333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, toiletry (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) toiletry\n(B) toiletry" }, { "from": "gpt", "value": "(A) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018407_393217185895458_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, clothing (highlighted by a red box) or footwear (highlighted by a blue box)?\n(A) clothing\n(B) footwear" }, { "from": "gpt", "value": "(B) footwear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429766_358304150982125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, toilet (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) toilet\n(B) toilet paper" }, { "from": "gpt", "value": "(A) toilet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444923_220942437218250_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to flyer (highlighted by a red box)? Select from passage (highlighted by a blue box) and sink (highlighted by a green box).\n(A) passage\n(B) sink" }, { "from": "gpt", "value": "(A) passage" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898254_696700027104375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to book (highlighted by a red box)? Select from picture frame (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898785_67276215846000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to table (highlighted by a red box)? Choose from pillow (highlighted by a blue box) and glass plate (highlighted by a green box).\n(A) pillow\n(B) glass plate" }, { "from": "gpt", "value": "(B) glass plate" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429835_748743934405166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, storage box (highlighted by a red box) or cardboard box (highlighted by a blue box)?\n(A) storage box\n(B) cardboard box" }, { "from": "gpt", "value": "(B) cardboard box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444869_97896777233791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from christmas tree (highlighted by a red box)? Select from candle (highlighted by a blue box) and window screen (highlighted by a green box).\n(A) candle\n(B) window screen" }, { "from": "gpt", "value": "(B) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334028_273549704647833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, cabinetry (highlighted by a red box) or chest of drawers (highlighted by a blue box)?\n(A) cabinetry\n(B) chest of drawers" }, { "from": "gpt", "value": "(B) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897478_112693152140583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the table lamp (highlighted by a red box)? Choose among these: chair (highlighted by a blue box) or nightstand (highlighted by a green box).\n(A) chair\n(B) nightstand" }, { "from": "gpt", "value": "(B) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649732_49781186829333_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, shelf (highlighted by a red box) or cardboard box (highlighted by a blue box)?\n(A) shelf\n(B) cardboard box" }, { "from": "gpt", "value": "(B) cardboard box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444791_51655978075416_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to drawer (highlighted by a red box)? Select from bathroom cabinet (highlighted by a blue box) and bidet (highlighted by a green box).\n(A) bathroom cabinet\n(B) bidet" }, { "from": "gpt", "value": "(A) bathroom cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204741_25174084340208_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331491_153139616840291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, bed (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) bed\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662891_19483503779500_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is ball (annotated by the red box) located relative to table lamp? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896103_145300900799083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, picture frame (highlighted by a red box) or door (highlighted by a blue box)?\n(A) picture frame\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444588_31807304718583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of picture frame (annotated by the red box) in relation to picture frame?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796590_17526684197708_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to toiletry (highlighted by a red box)? Select from tap (highlighted by a blue box) and sink (highlighted by a green box).\n(A) tap\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649393_11243704108958_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, book (highlighted by a red box) or table (highlighted by a blue box)?\n(A) book\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670184_51639742026125_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895972_406453552828791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, couple (highlighted by a red box) or footwear (highlighted by a blue box)?\n(A) couple\n(B) footwear" }, { "from": "gpt", "value": "(B) footwear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333040_59756264967250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, chair (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) chair\n(B) bottle" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334920_1091093901881250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of toilet paper (annotated by the red box) and bath mat in the image provided, where is toilet paper (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358257_6794871243375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of soap dispenser (annotated by the red box) in relation to tap?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333055_60300486409958_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, window (highlighted by a red box) or window blind (highlighted by a blue box)?\n(A) window\n(B) window blind" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669903_12290125607875_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the electric outlet (highlighted by a red box)? electric outlet (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) electric outlet\n(B) picture frame" }, { "from": "gpt", "value": "(A) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670208_54059664744291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, clock (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) clock\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895904_110584542332166_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895286_80183543725500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, drawer (highlighted by a red box) or footwear (highlighted by a blue box)?\n(A) drawer\n(B) footwear" }, { "from": "gpt", "value": "(A) drawer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896524_34642728282500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to toy (highlighted by a red box)? Select from toy (highlighted by a blue box) and basket (highlighted by a green box).\n(A) toy\n(B) basket" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332469_886507270227458_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the picture frame (highlighted by a red box)? Choose among these: studio couch (highlighted by a blue box) or door (highlighted by a green box).\n(A) studio couch\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828442_91342127982541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from appliance (highlighted by a red box), umbrella (highlighted by a blue box) or door (highlighted by a green box)?\n(A) umbrella\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261339_23867450756875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, stool (highlighted by a red box) or wall clock (highlighted by a blue box)?\n(A) stool\n(B) wall clock" }, { "from": "gpt", "value": "(A) stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796475_4326732067416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to table (highlighted by a red box)? Select from toy (highlighted by a blue box) and toy (highlighted by a green box).\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895231_74098383930541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, wrap (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) wrap\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333618_76345631051166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, stainless steel (highlighted by a red box) or banana (highlighted by a blue box)?\n(A) stainless steel\n(B) banana" }, { "from": "gpt", "value": "(A) stainless steel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429736_19951059417500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, shelf (highlighted by a red box) or book (highlighted by a blue box)?\n(A) shelf\n(B) book" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670016_30465981990916_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from window (highlighted by a red box), curtain (highlighted by a blue box) or mirror (highlighted by a green box)?\n(A) curtain\n(B) mirror" }, { "from": "gpt", "value": "(B) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458525_125916753570291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is studio couch (annotated by the red box) located relative to curtain?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429739_20166071733333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, computer chair (highlighted by a red box) or ball (highlighted by a blue box)?\n(A) computer chair\n(B) ball" }, { "from": "gpt", "value": "(B) ball" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261681_3634750660291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, gadget (highlighted by a red box) or extension cord (highlighted by a blue box)?\n(A) gadget\n(B) extension cord" }, { "from": "gpt", "value": "(B) extension cord" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260873_7539651211875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from home appliance (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and desk (highlighted by a green box).\n(A) picture frame\n(B) desk" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670323_65690789135540_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, curtain (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) curtain\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261230_13437515975083_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897509_472266401898416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of dumbbell (annotated by the red box) and table in the image provided, where is dumbbell (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429728_19232433214375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, nightstand (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) nightstand\n(B) pillow" }, { "from": "gpt", "value": "(A) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446072_80505567069291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, sink (highlighted by a red box) or porcelain (highlighted by a blue box)?\n(A) sink\n(B) porcelain" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663322_77705658469041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, kitchen appliance (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) kitchen appliance\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898988_823941693403333_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from pillow (highlighted by a red box)? Choose among these: window screen (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) window screen\n(B) pillow" }, { "from": "gpt", "value": "(A) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796475_4292929430750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, toy (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) toy\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334055_86024498526958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of furniture (annotated by the red box) in reference to furniture? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897783_129430233629000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, bidet (highlighted by a red box) or sink (highlighted by a blue box)?\n(A) bidet\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358380_18928852863333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from picture frame (highlighted by a red box)? pillow (highlighted by a blue box) or table (highlighted by a green box)?\n(A) pillow\n(B) table" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663312_76634375217791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, sink (highlighted by a red box) or tap (highlighted by a blue box)?\n(A) sink\n(B) tap" }, { "from": "gpt", "value": "(B) tap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331631_20002442767333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, dresser (highlighted by a red box) or counter top (highlighted by a blue box)?\n(A) dresser\n(B) counter top" }, { "from": "gpt", "value": "(A) dresser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899043_645744110135333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from sink (highlighted by a red box), plain (highlighted by a blue box) or soap (highlighted by a green box)?\n(A) plain\n(B) soap" }, { "from": "gpt", "value": "(A) plain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739844_17161125499582_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, mat (highlighted by a red box) or concrete (highlighted by a blue box)?\n(A) mat\n(B) concrete" }, { "from": "gpt", "value": "(A) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331207_279299283154583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, coffee table (highlighted by a red box) or window screen (highlighted by a blue box)?\n(A) coffee table\n(B) window screen" }, { "from": "gpt", "value": "(A) coffee table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333785_48929978321166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, tap (highlighted by a red box) or food (highlighted by a blue box)?\n(A) tap\n(B) food" }, { "from": "gpt", "value": "(B) food" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430677_326568081360916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, bottle (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) bottle\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895824_1219924669116208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, window sill (highlighted by a red box) or table (highlighted by a blue box)?\n(A) window sill\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897631_139538462899250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, nightstand (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) nightstand\n(B) table lamp" }, { "from": "gpt", "value": "(A) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670075_38573514909333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to door (highlighted by a red box)? Choose from furniture (highlighted by a blue box) and door (highlighted by a green box).\n(A) furniture\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895610_469714556944083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of clothing (annotated by the red box) in reference to furniture? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458447_117502590660333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from bicycle (highlighted by a red box)? bicycle (highlighted by a blue box) or gas stove (highlighted by a green box)?\n(A) bicycle\n(B) gas stove" }, { "from": "gpt", "value": "(B) gas stove" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115634_3541996501875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, gas stove (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) gas stove\n(B) appliance" }, { "from": "gpt", "value": "(A) gas stove" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018544_828928965477166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, toilet (highlighted by a red box) or material (highlighted by a blue box)?\n(A) toilet\n(B) material" }, { "from": "gpt", "value": "(B) material" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261532_74108424987750_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to pillow (highlighted by a red box), pillow (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333268_22050311651833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, oven (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) oven\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204517_771169084708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the cabinetry (highlighted by a red box)? Choose among these: electric outlet (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) electric outlet\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897490_471242827252458_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, studio couch (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) studio couch\n(B) chair" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897655_147191783619791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, gas stove (highlighted by a red box) or kettle (highlighted by a blue box)?\n(A) gas stove\n(B) kettle" }, { "from": "gpt", "value": "(B) kettle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897537_473520894815708_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358112_61757596373250_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the picture frame (highlighted by a red box)? wall clock (highlighted by a blue box) or bath (highlighted by a green box).\n(A) wall clock\n(B) bath" }, { "from": "gpt", "value": "(B) bath" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333625_76913561439916_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444716_75537866892958_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from perfume (highlighted by a red box)? Choose from mouthwash (highlighted by a blue box) and ledge (highlighted by a green box).\n(A) mouthwash\n(B) ledge" }, { "from": "gpt", "value": "(A) mouthwash" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331346_192304505350458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, bookcase (highlighted by a red box) or folding chair (highlighted by a blue box)?\n(A) bookcase\n(B) folding chair" }, { "from": "gpt", "value": "(B) folding chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444907_106190065556791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the radiator (highlighted by a red box)? appliance (highlighted by a blue box) or door (highlighted by a green box).\n(A) appliance\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896096_144230790899541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from picture frame (highlighted by a red box), chair (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898191_145172220050875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, picture frame (highlighted by a red box) or person (highlighted by a blue box)?\n(A) picture frame\n(B) person" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670028_32356501460041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the toaster (highlighted by a red box)? appliance (highlighted by a blue box) or countertop (highlighted by a green box).\n(A) appliance\n(B) countertop" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261722_2915706637708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, studio couch (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) studio couch\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429860_13521248215333_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from television (highlighted by a red box)? Choose among these: chest of drawers (highlighted by a blue box) or plain (highlighted by a green box).\n(A) chest of drawers\n(B) plain" }, { "from": "gpt", "value": "(B) plain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261689_385144628416_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from radiator (highlighted by a red box)? furniture (highlighted by a blue box) or door (highlighted by a green box)?\n(A) furniture\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895587_1160160543932166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, radiator (highlighted by a red box) or drawer (highlighted by a blue box)?\n(A) radiator\n(B) drawer" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796709_27455090075583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, armchair (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) armchair\n(B) picture frame" }, { "from": "gpt", "value": "(A) armchair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333281_25646528457333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from dumbbell (highlighted by a red box)? Select from chair (highlighted by a blue box) and beach towel (highlighted by a green box).\n(A) chair\n(B) beach towel" }, { "from": "gpt", "value": "(B) beach towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899935_863070775936708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, cabinetry (highlighted by a red box) or light fixture (highlighted by a blue box)?\n(A) cabinetry\n(B) light fixture" }, { "from": "gpt", "value": "(B) light fixture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899030_642999080451083_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from book (highlighted by a red box), book (highlighted by a blue box) or book (highlighted by a green box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332597_363079120079083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, doormat (highlighted by a red box) or doormat (highlighted by a blue box)?\n(A) doormat\n(B) doormat" }, { "from": "gpt", "value": "(A) doormat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332774_44457647956916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, door (highlighted by a red box) or door (highlighted by a blue box)?\n(A) door\n(B) door" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895633_471758399969958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the Wii controller (highlighted by a red box)? Choose among these: furniture (highlighted by a blue box) or armchair (highlighted by a green box).\n(A) furniture\n(B) armchair" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332817_49117502119166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of screen door (annotated by the red box) in relation to clothing? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115650_4759648844125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from screen door (highlighted by a red box)? Select from window frame (highlighted by a blue box) and barn door (highlighted by a green box).\n(A) window frame\n(B) barn door" }, { "from": "gpt", "value": "(B) barn door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445902_68244582512333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from chair (highlighted by a red box)? Choose among these: cabinetry (highlighted by a blue box) or table (highlighted by a green box).\n(A) cabinetry\n(B) table" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897757_117807209867791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from pillow (highlighted by a red box), table lamp (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) table lamp\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796575_16902675448581_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, table lamp (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) table lamp\n(B) pillow" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334208_105517888917458_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from toiletry (highlighted by a red box)? door (highlighted by a blue box) or step stool (highlighted by a green box)?\n(A) door\n(B) step stool" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898696_580861680974541_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears farthest from the camera in this image?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261344_24195337790750_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from cabinetry (highlighted by a red box)? Choose from exhaust hood (highlighted by a blue box) and tap (highlighted by a green box).\n(A) exhaust hood\n(B) tap" }, { "from": "gpt", "value": "(B) tap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333494_62317591506041_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from light fixture (highlighted by a red box), studio couch (highlighted by a blue box) or clock (highlighted by a green box)?\n(A) studio couch\n(B) clock" }, { "from": "gpt", "value": "(B) clock" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444574_31927805789666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is electric outlet (annotated by the red box) located relative to furniture? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261164_757916819666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, studio couch (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) studio couch\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115427_4875602988458_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to drawer (highlighted by a red box)? Choose from toilet paper (highlighted by a blue box) and bathroom cabinet (highlighted by a green box).\n(A) toilet paper\n(B) bathroom cabinet" }, { "from": "gpt", "value": "(B) bathroom cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331910_627523877558208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, desk (highlighted by a red box) or computer (highlighted by a blue box)?\n(A) desk\n(B) computer" }, { "from": "gpt", "value": "(B) computer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332290_385309591802750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, bottle (highlighted by a red box) or tile (highlighted by a blue box)?\n(A) bottle\n(B) tile" }, { "from": "gpt", "value": "(B) tile" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334935_663028890336125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, chair (highlighted by a red box) or fabric (highlighted by a blue box)?\n(A) chair\n(B) fabric" }, { "from": "gpt", "value": "(B) fabric" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115634_3509992488416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, picture frame (highlighted by a red box) or chest of drawers (highlighted by a blue box)?\n(A) picture frame\n(B) chest of drawers" }, { "from": "gpt", "value": "(B) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018853_650474261466916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, cleaning product (highlighted by a red box) or bath (highlighted by a blue box)?\n(A) cleaning product\n(B) bath" }, { "from": "gpt", "value": "(A) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333331_29905828919458_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from washing machine (highlighted by a red box)? Choose from towel (highlighted by a blue box) and towel (highlighted by a green box).\n(A) towel\n(B) towel" }, { "from": "gpt", "value": "(B) towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115158_87638992589416_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the window sill (highlighted by a red box)? bed (highlighted by a blue box) or table lamp (highlighted by a green box).\n(A) bed\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897757_117855223254291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chair (highlighted by a red box) or glass door (highlighted by a blue box)?\n(A) chair\n(B) glass door" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332046_208813936148916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, clothing (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) clothing\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898461_156571283172833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to mirror (highlighted by a red box)? Select from screen door (highlighted by a blue box) and curtain (highlighted by a green box).\n(A) screen door\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444925_220797546341208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, screen door (highlighted by a red box) or sticker (highlighted by a blue box)?\n(A) screen door\n(B) sticker" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895975_406314659824750_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458634_127497875020125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, chair (highlighted by a red box) or table (highlighted by a blue box)?\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670291_62378623012958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, table (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) table\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898023_221061236159500_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from glass vase (highlighted by a red box)? window (highlighted by a blue box) or round table (highlighted by a green box)?\n(A) window\n(B) round table" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430773_338906942265916_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from cardboard box (highlighted by a red box)? bean bag chair (highlighted by a blue box) or bean bag chair (highlighted by a green box)?\n(A) bean bag chair\n(B) bean bag chair" }, { "from": "gpt", "value": "(A) bean bag chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458582_1554874526458_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the bath (highlighted by a red box)? Choose among these: counter top (highlighted by a blue box) or porcelain (highlighted by a green box).\n(A) counter top\n(B) porcelain" }, { "from": "gpt", "value": "(B) porcelain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895911_493969910433791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to toiletry (highlighted by a red box)? medicine cabinet (highlighted by a blue box) or toilet (highlighted by a green box).\n(A) medicine cabinet\n(B) toilet" }, { "from": "gpt", "value": "(B) toilet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670334_66412195881916_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to oven (highlighted by a red box)? Select from gas stove (highlighted by a blue box) and bath towel (highlighted by a green box).\n(A) gas stove\n(B) bath towel" }, { "from": "gpt", "value": "(B) bath towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649774_43540207307791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899030_642999080451083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, shelf (highlighted by a red box) or bookcase (highlighted by a blue box)?\n(A) shelf\n(B) bookcase" }, { "from": "gpt", "value": "(B) bookcase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898785_67319115254125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of chair (annotated by the red box) in relation to furniture? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115180_104092048815750_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from curtain (highlighted by a red box)? lamp (highlighted by a blue box) or window (highlighted by a green box)?\n(A) lamp\n(B) window" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899654_233410264715750_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to curtain (highlighted by a red box)? door (highlighted by a blue box) or curtain (highlighted by a green box).\n(A) door\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896101_145153212035166_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the curtain (highlighted by a red box)? curtain (highlighted by a blue box) or window (highlighted by a green box).\n(A) curtain\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430860_74434597113750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, file cabinet (highlighted by a red box) or table (highlighted by a blue box)?\n(A) file cabinet\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261486_41822869824041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, furniture (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) furniture\n(B) radiator" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670350_67422580503041_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898587_184563783589833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670008_30407588439083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the picture frame (highlighted by a red box)? fireplace (highlighted by a blue box) or window (highlighted by a green box).\n(A) fireplace\n(B) window" }, { "from": "gpt", "value": "(A) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429830_748550729071666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to cardboard box (highlighted by a red box), box (highlighted by a blue box) or glass door (highlighted by a green box)?\n(A) box\n(B) glass door" }, { "from": "gpt", "value": "(A) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897410_103091785792041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from appliance (highlighted by a red box)? Choose among these: kitchen appliance (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) kitchen appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358731_6799829190333_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of chair (annotated by the red box) in reference to mat? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115401_3229760267958_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458437_117581491310333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from countertop (highlighted by a red box)? screen door (highlighted by a blue box) or home appliance (highlighted by a green box)?\n(A) screen door\n(B) home appliance" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261681_3596649772708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from picture frame (highlighted by a red box)? Select from pillow (highlighted by a blue box) and window screen (highlighted by a green box).\n(A) pillow\n(B) window screen" }, { "from": "gpt", "value": "(B) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828393_94670099608125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the bathtub (highlighted by a red box)? mirror (highlighted by a blue box) or window frame (highlighted by a green box).\n(A) mirror\n(B) window frame" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331091_134646720006458_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, table (highlighted by a red box) or storage box (highlighted by a blue box)?\n(A) table\n(B) storage box" }, { "from": "gpt", "value": "(B) storage box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333674_134213760853082_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, chair (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) chair\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332606_363412312236125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, houseplant (highlighted by a red box) or vanity (highlighted by a blue box)?\n(A) houseplant\n(B) vanity" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670197_53442206816083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from stool (highlighted by a red box)? Choose among these: desk (highlighted by a blue box) or book (highlighted by a green box).\n(A) desk\n(B) book" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649409_10268687222291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, picture frame (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) picture frame\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331258_285789702570250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, armchair (highlighted by a red box) or laptop (highlighted by a blue box)?\n(A) armchair\n(B) laptop" }, { "from": "gpt", "value": "(A) armchair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261153_609608920500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the pillow (highlighted by a red box)? studio couch (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331618_18011379221625_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of shelf (annotated by the red box) in relation to speaker?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895186_37760677816541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from swivel chair (highlighted by a red box)? plastic bag (highlighted by a blue box) or furniture (highlighted by a green box)?\n(A) plastic bag\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739940_17381507746873_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from plant (highlighted by a red box)? home appliance (highlighted by a blue box) or oven (highlighted by a green box)?\n(A) home appliance\n(B) oven" }, { "from": "gpt", "value": "(B) oven" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48017890_80989457359208_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from bowl (highlighted by a red box)? faucet (highlighted by a blue box) or gas stove (highlighted by a green box)?\n(A) faucet\n(B) gas stove" }, { "from": "gpt", "value": "(A) faucet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204381_18143935651875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, bookshelf (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) bookshelf\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204800_24099126422333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhere is door (annotated by the red box) located in relation to door in the image?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663227_66789166592666_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, footwear (highlighted by a red box) or fabric (highlighted by a blue box)?\n(A) footwear\n(B) fabric" }, { "from": "gpt", "value": "(B) fabric" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445612_56510211078041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to electric outlet (highlighted by a red box)? Select from gas stove (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) gas stove\n(B) cabinetry" }, { "from": "gpt", "value": "(A) gas stove" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649787_45943004509208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, curtain (highlighted by a red box) or door (highlighted by a blue box)?\n(A) curtain\n(B) door" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899654_233487967155291_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from letter (highlighted by a red box)? Choose from letter (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) letter\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358362_16383368787708_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, remote (highlighted by a red box) or paperback book (highlighted by a blue box)?\n(A) remote\n(B) paperback book" }, { "from": "gpt", "value": "(A) remote" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430928_92943584426875_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to pillow (highlighted by a red box), desk (highlighted by a blue box) or clothing (highlighted by a green box)?\n(A) desk\n(B) clothing" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115363_1041364235583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261641_685806202041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331211_281194248512250_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the design (highlighted by a red box)? bed (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) bed\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444869_97900775616125_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to shelf (highlighted by a red box)? shoe (highlighted by a blue box) or door (highlighted by a green box).\n(A) shoe\n(B) door" }, { "from": "gpt", "value": "(A) shoe" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670044_33353412265624_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from toy (highlighted by a red box), bulletin board (highlighted by a blue box) or toy (highlighted by a green box)?\n(A) bulletin board\n(B) toy" }, { "from": "gpt", "value": "(A) bulletin board" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897509_472252407637458_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, dumbbell (highlighted by a red box) or table (highlighted by a blue box)?\n(A) dumbbell\n(B) table" }, { "from": "gpt", "value": "(A) dumbbell" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828245_81706490708791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, curtain (highlighted by a red box) or shower curtain (highlighted by a blue box)?\n(A) curtain\n(B) shower curtain" }, { "from": "gpt", "value": "(B) shower curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334935_663034887911375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, table (highlighted by a red box) or entertainment center (highlighted by a blue box)?\n(A) table\n(B) entertainment center" }, { "from": "gpt", "value": "(B) entertainment center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204800_24081133558416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from door (highlighted by a red box)? Choose from refrigerator (highlighted by a blue box) and armchair (highlighted by a green box).\n(A) refrigerator\n(B) armchair" }, { "from": "gpt", "value": "(B) armchair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649774_43582207348916_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333882_77126463135666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, picture frame (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) picture frame\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663007_32278121982708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, picture frame (highlighted by a red box) or window (highlighted by a blue box)?\n(A) picture frame\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331143_177734639913708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, door (highlighted by a red box) or water cooler (highlighted by a blue box)?\n(A) door\n(B) water cooler" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261695_551745427666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, electric outlet (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) electric outlet\n(B) cabinetry" }, { "from": "gpt", "value": "(A) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115158_87724190671833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of pillow (annotated by the red box) in reference to material?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898221_164095828405166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332109_683187801423916_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to plain (highlighted by a red box)? table (highlighted by a blue box) or table lamp (highlighted by a green box).\n(A) table\n(B) table lamp" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332956_22056400767458_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663322_77563667611375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the curtain (highlighted by a red box)? table (highlighted by a blue box) or chair (highlighted by a green box).\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334514_64378760156333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from mirror (highlighted by a red box)? Select from sink (highlighted by a blue box) and toilet paper (highlighted by a green box).\n(A) sink\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018828_647418980599625_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of studio couch (annotated by the red box) and blanket in the image provided, where is studio couch (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331277_13135744741291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the houseplant (highlighted by a red box)? Choose among these: curtain (highlighted by a blue box) or radiator (highlighted by a green box).\n(A) curtain\n(B) radiator" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358345_15202816272125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the book (highlighted by a red box)? book (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) book\n(B) picture frame" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895995_136166413138166_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from picture frame (highlighted by a red box)? lamp (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) lamp\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445583_283637559872750_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739463_51522397443041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to mirror (highlighted by a red box)? trash bin/can (highlighted by a blue box) or door (highlighted by a green box).\n(A) trash bin/can\n(B) door" }, { "from": "gpt", "value": "(A) trash bin/can" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332991_125354084918791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to book (highlighted by a red box), book (highlighted by a blue box) or toy (highlighted by a green box)?\n(A) book\n(B) toy" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334185_354556260676000_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from book (highlighted by a red box)? book cover (highlighted by a blue box) or table (highlighted by a green box)?\n(A) book cover\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445782_64420282620125_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828476_100575056477208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, cabinetry (highlighted by a red box) or bulletin board (highlighted by a blue box)?\n(A) cabinetry\n(B) bulletin board" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429841_11955265681958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from oven (highlighted by a red box)? Choose from kitchen appliance (highlighted by a blue box) and kitchen appliance (highlighted by a green box).\n(A) kitchen appliance\n(B) kitchen appliance" }, { "from": "gpt", "value": "(A) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896160_139896078300500_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from cleaning product (highlighted by a red box)? Select from shelf (highlighted by a blue box) and cleaning product (highlighted by a green box).\n(A) shelf\n(B) cleaning product" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358645_3121534522291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from saucer (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and coffee cup (highlighted by a green box).\n(A) picture frame\n(B) coffee cup" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739740_3744099033125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, curtain (highlighted by a red box) or window screen (highlighted by a blue box)?\n(A) curtain\n(B) window screen" }, { "from": "gpt", "value": "(B) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898577_183685699939833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, toy (highlighted by a red box) or window frame (highlighted by a blue box)?\n(A) toy\n(B) window frame" }, { "from": "gpt", "value": "(B) window frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895896_109602418382625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, bird (highlighted by a red box) or book (highlighted by a blue box)?\n(A) bird\n(B) book" }, { "from": "gpt", "value": "(A) bird" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261288_15846666695166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of picture frame (annotated by the red box) in reference to bed?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458703_136722467057666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, screen door (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) screen door\n(B) picture frame" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261486_41820870614625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, book (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) book\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663349_91032801259666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from flower (highlighted by a red box)? floral arrangement (highlighted by a blue box) or counter (highlighted by a green box)?\n(A) floral arrangement\n(B) counter" }, { "from": "gpt", "value": "(A) floral arrangement" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828507_102517366792166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, cabinetry (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) cabinetry\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663322_77599669302833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from electric outlet (highlighted by a red box)? Select from candle holder (highlighted by a blue box) and bathroom cabinet (highlighted by a green box).\n(A) candle holder\n(B) bathroom cabinet" }, { "from": "gpt", "value": "(B) bathroom cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334934_663301596346833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333803_51404540673750_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from screen door (highlighted by a red box)? Choose among these: chair (highlighted by a blue box) or book (highlighted by a green box).\n(A) chair\n(B) book" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828552_101544712599666_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to footwear (highlighted by a red box)? Select from bath towel (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) bath towel\n(B) cabinetry" }, { "from": "gpt", "value": "(A) bath towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458772_142313238821041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, luggage (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) luggage\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649440_12639544559583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to clothing (highlighted by a red box)? Choose from door (highlighted by a blue box) and closet (highlighted by a green box).\n(A) door\n(B) closet" }, { "from": "gpt", "value": "(B) closet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445834_68129677990957_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333875_76100071787166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, toy (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) toy\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458337_102864722129875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, cabinetry (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) cabinetry\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895623_470807442393250_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the cleaning product (highlighted by a red box)? porcelain (highlighted by a blue box) or sink (highlighted by a green box).\n(A) porcelain\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332158_260151229150583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, furniture (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) furniture\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445047_1885740278083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, person (highlighted by a red box) or armchair (highlighted by a blue box)?\n(A) person\n(B) armchair" }, { "from": "gpt", "value": "(B) armchair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261681_3602747248000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from studio couch (highlighted by a red box)? star (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) star\n(B) pillow" }, { "from": "gpt", "value": "(A) star" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358117_62360084322291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to kitchen appliance (highlighted by a red box)? sink (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) sink\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458621_127084371690500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to toilet paper (highlighted by a red box)? toilet paper (highlighted by a blue box) or window sill (highlighted by a green box).\n(A) toilet paper\n(B) window sill" }, { "from": "gpt", "value": "(A) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018833_649155958872791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from book (highlighted by a red box)? Choose from paperback book (highlighted by a blue box) and paperback book (highlighted by a green box).\n(A) paperback book\n(B) paperback book" }, { "from": "gpt", "value": "(B) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332389_398717121594375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, television (highlighted by a red box) or glass door (highlighted by a blue box)?\n(A) television\n(B) glass door" }, { "from": "gpt", "value": "(B) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898653_573063928063458_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204330_14281807615375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, bed (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) bed\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896009_137122264695625_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, studio couch (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) studio couch\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430221_180213398380333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, stationery (highlighted by a red box) or mousepad (highlighted by a blue box)?\n(A) stationery\n(B) mousepad" }, { "from": "gpt", "value": "(A) stationery" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796590_17466475792500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, ceramic tile (highlighted by a red box) or bath mat (highlighted by a blue box)?\n(A) ceramic tile\n(B) bath mat" }, { "from": "gpt", "value": "(A) ceramic tile" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332473_886622173820333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, studio couch (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331431_545936918673165_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from toy (highlighted by a red box)? toy (highlighted by a blue box) or teddy bear (highlighted by a green box)?\n(A) toy\n(B) teddy bear" }, { "from": "gpt", "value": "(B) teddy bear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334920_1091069894912625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to mirror (highlighted by a red box)? door handle (highlighted by a blue box) or light fixture (highlighted by a green box).\n(A) door handle\n(B) light fixture" }, { "from": "gpt", "value": "(A) door handle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897728_114230440104375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from furniture (highlighted by a red box)? Select from bay window (highlighted by a blue box) and television (highlighted by a green box).\n(A) bay window\n(B) television" }, { "from": "gpt", "value": "(A) bay window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261331_24080929054041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from toilet (highlighted by a red box)? Choose among these: bathtub (highlighted by a blue box) or basket (highlighted by a green box).\n(A) bathtub\n(B) basket" }, { "from": "gpt", "value": "(A) bathtub" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447294_408934302454291_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332400_405824764296250_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the beach towel (highlighted by a red box)? Choose among these: countertop (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) countertop\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115401_3195773697375_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to chair (highlighted by a red box)? Select from computer monitor (highlighted by a blue box) and computer keyboard (highlighted by a green box).\n(A) computer monitor\n(B) computer keyboard" }, { "from": "gpt", "value": "(B) computer keyboard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333325_29489823795375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from garment (highlighted by a red box)? blanket (highlighted by a blue box) or blanket (highlighted by a green box)?\n(A) blanket\n(B) blanket" }, { "from": "gpt", "value": "(A) blanket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670346_66316500401166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, picture frame (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) picture frame\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662882_16721490305500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from table (highlighted by a red box)? Select from picture frame (highlighted by a blue box) and candle holder (highlighted by a green box).\n(A) picture frame\n(B) candle holder" }, { "from": "gpt", "value": "(B) candle holder" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204362_15655135453875_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the chair (highlighted by a red box)? Choose among these: glass door (highlighted by a blue box) or chair (highlighted by a green box).\n(A) glass door\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333462_57400668514916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, television (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) television\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358105_61835497481375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from screen door (highlighted by a red box)? Choose from chair (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) chair\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332022_202521098629791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, bottle (highlighted by a red box) or sink (highlighted by a blue box)?\n(A) bottle\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445173_8147934555791_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to window (highlighted by a red box)? Choose from table lamp (highlighted by a blue box) and curtain (highlighted by a green box).\n(A) table lamp\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333836_53924172074708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, blanket (highlighted by a red box) or fabric (highlighted by a blue box)?\n(A) blanket\n(B) fabric" }, { "from": "gpt", "value": "(A) blanket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897973_216821855345166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, electric outlet (highlighted by a red box) or waste container (highlighted by a blue box)?\n(A) electric outlet\n(B) waste container" }, { "from": "gpt", "value": "(A) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895994_136243214592625_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from picture frame (highlighted by a red box)? Choose from remote control (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) remote control\n(B) picture frame" }, { "from": "gpt", "value": "(A) remote control" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333803_51390546360291_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to book (highlighted by a red box)? Select from book (highlighted by a blue box) and book (highlighted by a green box).\n(A) book\n(B) book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446466_355466452800000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to dog bed (highlighted by a red box)? furniture (highlighted by a blue box) or furniture (highlighted by a green box).\n(A) furniture\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458503_113283976241708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to pillow (highlighted by a red box)? Choose from studio couch (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897822_132844290981875_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446450_354735028557833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from pillow (highlighted by a red box)? Choose from lamp (highlighted by a blue box) and cabinet (highlighted by a green box).\n(A) lamp\n(B) cabinet" }, { "from": "gpt", "value": "(B) cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115197_105560760033416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, furniture (highlighted by a red box) or door (highlighted by a blue box)?\n(A) furniture\n(B) door" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897945_351510714722083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from studio couch (highlighted by a red box)? coffee cup (highlighted by a blue box) or coffee table (highlighted by a green box)?\n(A) coffee cup\n(B) coffee table" }, { "from": "gpt", "value": "(A) coffee cup" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445444_149646015016333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, sink (highlighted by a red box) or shower (highlighted by a blue box)?\n(A) sink\n(B) shower" }, { "from": "gpt", "value": "(B) shower" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662882_16667494999875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, chair (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) chair\n(B) mat" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332950_20694123305916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, toy (highlighted by a red box) or comic book (highlighted by a blue box)?\n(A) toy\n(B) comic book" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898254_696730031431333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, electric outlet (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) electric outlet\n(B) lamp" }, { "from": "gpt", "value": "(A) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897939_351232812872500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of furniture (annotated by the red box) in relation to chair? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333480_60185702857000_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to bath (highlighted by a red box), shopping cart (highlighted by a blue box) or clothing (highlighted by a green box)?\n(A) shopping cart\n(B) clothing" }, { "from": "gpt", "value": "(A) shopping cart" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669896_11098705224958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to chair (highlighted by a red box)? blanket (highlighted by a blue box) or studio couch (highlighted by a green box).\n(A) blanket\n(B) studio couch" }, { "from": "gpt", "value": "(A) blanket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895908_110734946680666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from lamp (highlighted by a red box)? lamp (highlighted by a blue box) or lamp (highlighted by a green box)?\n(A) lamp\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261555_75419167239125_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the lamp (highlighted by a red box)? Choose among these: power outlet (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) power outlet\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895448_129459087843875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from toilet paper (highlighted by a red box)? picnic basket (highlighted by a blue box) or toilet paper (highlighted by a green box)?\n(A) picnic basket\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670201_53354609922083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the pillow (highlighted by a red box)? studio couch (highlighted by a blue box) or table lamp (highlighted by a green box).\n(A) studio couch\n(B) table lamp" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896176_141433645591041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, furniture (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) furniture\n(B) electric outlet" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333864_75481549410458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, towel (highlighted by a red box) or towel (highlighted by a blue box)?\n(A) towel\n(B) towel" }, { "from": "gpt", "value": "(A) towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332207_264657374263916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, baby carriage (highlighted by a red box) or window screen (highlighted by a blue box)?\n(A) baby carriage\n(B) window screen" }, { "from": "gpt", "value": "(B) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358645_3211430652250_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from coffee cup (highlighted by a red box)? bowl (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) bowl\n(B) chair" }, { "from": "gpt", "value": "(A) bowl" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333016_130039302992416_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to book (highlighted by a red box)? book (highlighted by a blue box) or book (highlighted by a green box).\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430439_1072461206000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, toy (highlighted by a red box) or glass jar (highlighted by a blue box)?\n(A) toy\n(B) glass jar" }, { "from": "gpt", "value": "(B) glass jar" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334890_623275948134125_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to clothing (highlighted by a red box)? Select from clock (highlighted by a blue box) and clothing (highlighted by a green box).\n(A) clock\n(B) clothing" }, { "from": "gpt", "value": "(B) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445206_10657927400333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to window sill (highlighted by a red box), basket (highlighted by a blue box) or entertainment center (highlighted by a green box)?\n(A) basket\n(B) entertainment center" }, { "from": "gpt", "value": "(A) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430442_774448361041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, bottle (highlighted by a red box) or apple (highlighted by a blue box)?\n(A) bottle\n(B) apple" }, { "from": "gpt", "value": "(B) apple" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204474_25025577017583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to paper plate (highlighted by a red box), studio couch (highlighted by a blue box) or coffee table (highlighted by a green box)?\n(A) studio couch\n(B) coffee table" }, { "from": "gpt", "value": "(B) coffee table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48017962_455972212050375_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears farthest from the camera in this image?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897490_471154230612416_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828272_84490783801958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, appliance (highlighted by a red box) or door (highlighted by a blue box)?\n(A) appliance\n(B) door" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430441_824261575625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, paper towel (highlighted by a red box) or tea pot (highlighted by a blue box)?\n(A) paper towel\n(B) tea pot" }, { "from": "gpt", "value": "(A) paper towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429756_356867761218833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chair (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) chair\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358345_15184823417958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to sink (highlighted by a red box)? Select from countertop (highlighted by a blue box) and lamp (highlighted by a green box).\n(A) countertop\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444793_51539376030875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from toilet paper (highlighted by a red box)? Select from screen door (highlighted by a blue box) and toilet bowl (highlighted by a green box).\n(A) screen door\n(B) toilet bowl" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739276_42757472676750_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to chair (highlighted by a red box)? Select from floral arrangement (highlighted by a blue box) and chair (highlighted by a green box).\n(A) floral arrangement\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896031_129153841608791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from window (highlighted by a red box)? Choose from curtain (highlighted by a blue box) and paperback book (highlighted by a green box).\n(A) curtain\n(B) paperback book" }, { "from": "gpt", "value": "(B) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739933_16662809024957_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, toilet (highlighted by a red box) or soap (highlighted by a blue box)?\n(A) toilet\n(B) soap" }, { "from": "gpt", "value": "(B) soap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895904_110629340458291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the book (highlighted by a red box)? Choose among these: dot (highlighted by a blue box) or book (highlighted by a green box).\n(A) dot\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898689_577270711574291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, sink (highlighted by a red box) or toilet (highlighted by a blue box)?\n(A) sink\n(B) toilet" }, { "from": "gpt", "value": "(B) toilet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333040_59700754159416_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from paper towel (highlighted by a red box), cleaning product (highlighted by a blue box) or soap (highlighted by a green box)?\n(A) cleaning product\n(B) soap" }, { "from": "gpt", "value": "(A) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663415_95878879744166_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358620_616313604666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, footwear (highlighted by a red box) or footwear (highlighted by a blue box)?\n(A) footwear\n(B) footwear" }, { "from": "gpt", "value": "(B) footwear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115299_119617129014291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, table (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) table\n(B) picture frame" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446466_355464453615208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, table (highlighted by a red box) or table (highlighted by a blue box)?\n(A) table\n(B) table" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358263_7271851136541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, cabinetry (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) cabinetry\n(B) cabinetry" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358257_6820877619666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of porcelain (annotated by the red box) in relation to waste container?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898651_572719021411333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, picture frame (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) picture frame\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670016_30435993862125_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from picture frame (highlighted by a red box)? Choose among these: design (highlighted by a blue box) or table lamp (highlighted by a green box).\n(A) design\n(B) table lamp" }, { "from": "gpt", "value": "(A) design" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899970_632361019750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, studio couch (highlighted by a red box) or equipment (highlighted by a blue box)?\n(A) studio couch\n(B) equipment" }, { "from": "gpt", "value": "(B) equipment" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895796_680711398161250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, chair (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) chair\n(B) furniture" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895960_133577865160666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, stool (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) stool\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897455_469659472851208_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the curtain (highlighted by a red box)? Choose among these: tableware (highlighted by a blue box) or person (highlighted by a green box).\n(A) tableware\n(B) person" }, { "from": "gpt", "value": "(B) person" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115504_12264311749250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333288_25277828971000_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to bed (highlighted by a red box)? picture frame (highlighted by a blue box) or toy (highlighted by a green box).\n(A) picture frame\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334665_390786282714541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to table (highlighted by a red box), bookcase (highlighted by a blue box) or book (highlighted by a green box)?\n(A) bookcase\n(B) book" }, { "from": "gpt", "value": "(A) bookcase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445997_133907460662541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to tap (highlighted by a red box)? Select from appliance (highlighted by a blue box) and appliance (highlighted by a green box).\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446485_355938343253541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from furniture (highlighted by a red box), sculpture (highlighted by a blue box) or swivel chair (highlighted by a green box)?\n(A) sculpture\n(B) swivel chair" }, { "from": "gpt", "value": "(A) sculpture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458690_135424785547915_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chair (highlighted by a red box) or table (highlighted by a blue box)?\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899209_186679377539291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, electric outlet (highlighted by a red box) or table (highlighted by a blue box)?\n(A) electric outlet\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333873_76243380412750_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the footwear (highlighted by a red box)? furniture (highlighted by a blue box) or swivel chair (highlighted by a green box).\n(A) furniture\n(B) swivel chair" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331491_153207622476416_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the glass door (highlighted by a red box)? Choose among these: door (highlighted by a blue box) or bath towel (highlighted by a green box).\n(A) door\n(B) bath towel" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895987_136365613668290_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, lamp (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) lamp\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895793_680518592913958_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the armchair (highlighted by a red box)? curtain (highlighted by a blue box) or houseplant (highlighted by a green box).\n(A) curtain\n(B) houseplant" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663368_92553498388916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, bronze statue (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) bronze statue\n(B) window sill" }, { "from": "gpt", "value": "(A) bronze statue" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739629_1912264203291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, equipment (highlighted by a red box) or file cabinet (highlighted by a blue box)?\n(A) equipment\n(B) file cabinet" }, { "from": "gpt", "value": "(A) equipment" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333812_52249158753291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chest of drawers (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) chest of drawers\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358105_61807492399833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of furniture (annotated by the red box) in relation to blanket? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430776_338942344409125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of washing machine (annotated by the red box) in relation to bath?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333277_24401802351458_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to refrigerator (highlighted by a red box)? chair (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) chair\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204730_23444619535291_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to picture frame (highlighted by a red box)? window (highlighted by a blue box) or curtain (highlighted by a green box).\n(A) window\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458549_127583533777500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the pillow (highlighted by a red box)? pillow (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429799_737938734935000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to lamp (highlighted by a red box), studio couch (highlighted by a blue box) or plant (highlighted by a green box)?\n(A) studio couch\n(B) plant" }, { "from": "gpt", "value": "(B) plant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445639_58324769746916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, table lamp (highlighted by a red box) or chest of drawers (highlighted by a blue box)?\n(A) table lamp\n(B) chest of drawers" }, { "from": "gpt", "value": "(B) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332201_264392081979333_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from picture frame (highlighted by a red box)? Choose among these: lamp (highlighted by a blue box) or lamp (highlighted by a green box).\n(A) lamp\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331281_14164596738916_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from screen door (highlighted by a red box)? light fixture (highlighted by a blue box) or mirror (highlighted by a green box)?\n(A) light fixture\n(B) mirror" }, { "from": "gpt", "value": "(B) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018286_799461522748791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, door (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) door\n(B) picture frame" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446495_357726535494333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, bath (highlighted by a red box) or cleaning product (highlighted by a blue box)?\n(A) bath\n(B) cleaning product" }, { "from": "gpt", "value": "(A) bath" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204451_22975170113625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to window screen (highlighted by a red box), chair (highlighted by a blue box) or table (highlighted by a green box)?\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447294_408938300801000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to screen door (highlighted by a red box)? Select from window screen (highlighted by a blue box) and chair (highlighted by a green box).\n(A) window screen\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895635_471823889937333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, home appliance (highlighted by a red box) or speaker (highlighted by a blue box)?\n(A) home appliance\n(B) speaker" }, { "from": "gpt", "value": "(A) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429835_748727924208833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, window (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) window\n(B) houseplant" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649807_46799382344625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, stool (highlighted by a red box) or plain (highlighted by a blue box)?\n(A) stool\n(B) plain" }, { "from": "gpt", "value": "(B) plain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430248_182383279205041_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to book (highlighted by a red box)? Choose from book (highlighted by a blue box) and curtain (highlighted by a green box).\n(A) book\n(B) curtain" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333525_50353200603500_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458688_9217492384875_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the studio couch (highlighted by a red box)? window screen (highlighted by a blue box) or door (highlighted by a green box).\n(A) window screen\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897643_146916178300958_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, appliance (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445695_57400291156208_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from home appliance (highlighted by a red box), appliance (highlighted by a blue box) or appliance (highlighted by a green box)?\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204791_24172330790375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, door (highlighted by a red box) or door (highlighted by a blue box)?\n(A) door\n(B) door" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446446_82460119275083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, wood burning stove (highlighted by a red box) or table (highlighted by a blue box)?\n(A) wood burning stove\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115628_3415096697916_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to window (highlighted by a red box), door (highlighted by a blue box) or table (highlighted by a green box)?\n(A) door\n(B) table" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331346_192290511022500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from window (highlighted by a red box)? curtain (highlighted by a blue box) or lamp (highlighted by a green box)?\n(A) curtain\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261294_16266831151291_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from picture frame (highlighted by a red box)? Choose from radiator (highlighted by a blue box) and shelf (highlighted by a green box).\n(A) radiator\n(B) shelf" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333288_25285825727000_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from flower (highlighted by a red box)? Choose among these: picture frame (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334961_667567285163791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to counter top (highlighted by a red box)? paperback book (highlighted by a blue box) or book (highlighted by a green box).\n(A) paperback book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115412_4250759815415_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261339_23901437301541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, coffee machine (highlighted by a red box) or sink (highlighted by a blue box)?\n(A) coffee machine\n(B) sink" }, { "from": "gpt", "value": "(A) coffee machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649727_49013317722916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhere is chest of drawers (annotated by the red box) located in relation to table in the image?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333031_59060922771083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, pillow (highlighted by a red box) or clothing (highlighted by a blue box)?\n(A) pillow\n(B) clothing" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115216_95031229444291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, window screen (highlighted by a red box) or home appliance (highlighted by a blue box)?\n(A) window screen\n(B) home appliance" }, { "from": "gpt", "value": "(B) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333787_48820172936208_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358111_61643893400375_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896074_132752311149499_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, vanity (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) vanity\n(B) basket" }, { "from": "gpt", "value": "(B) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333055_60278995131416_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the table (highlighted by a red box)? houseplant (highlighted by a blue box) or houseplant (highlighted by a green box).\n(A) houseplant\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444924_220985336345500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, shower curtain (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) shower curtain\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897643_146950181255500_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to clothing (highlighted by a red box)? Choose from chair (highlighted by a blue box) and chest of drawers (highlighted by a green box).\n(A) chair\n(B) chest of drawers" }, { "from": "gpt", "value": "(B) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896209_2200176418500_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, picture frame (highlighted by a red box) or kitchen & dining room table (highlighted by a blue box)?\n(A) picture frame\n(B) kitchen & dining room table" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333475_58608243585041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the bed frame (highlighted by a red box)? Choose among these: throw pillow (highlighted by a blue box) or bean bag chair (highlighted by a green box).\n(A) throw pillow\n(B) bean bag chair" }, { "from": "gpt", "value": "(A) throw pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334037_278648014809166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to shelf (highlighted by a red box)? bottle (highlighted by a blue box) or book (highlighted by a green box).\n(A) bottle\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331399_200331601326916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, map (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) map\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331498_153788312950166_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to bathroom cabinet (highlighted by a red box)? mouthwash (highlighted by a blue box) or cleaning product (highlighted by a green box).\n(A) mouthwash\n(B) cleaning product" }, { "from": "gpt", "value": "(B) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332778_44586045942708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from appliance (highlighted by a red box)? Choose from houseplant (highlighted by a blue box) and appliance (highlighted by a green box).\n(A) houseplant\n(B) appliance" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458626_127668290884833_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430248_182347277114791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670116_41783680395000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, cabinetry (highlighted by a red box) or picnic basket (highlighted by a blue box)?\n(A) cabinetry\n(B) picnic basket" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358324_18847679818000_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444696_72498777200125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from bay window (highlighted by a red box), parking sign (highlighted by a blue box) or curtain (highlighted by a green box)?\n(A) parking sign\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896103_145322908325166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, studio couch (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) studio couch\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897655_147119379581791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, window (highlighted by a red box) or table (highlighted by a blue box)?\n(A) window\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895184_37858571526541_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828340_78867430195708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from computer monitor (highlighted by a red box)? bulletin board (highlighted by a blue box) or computer monitor (highlighted by a green box)?\n(A) bulletin board\n(B) computer monitor" }, { "from": "gpt", "value": "(A) bulletin board" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333308_28085351076166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from radiator (highlighted by a red box)? cabinetry (highlighted by a blue box) or vase (highlighted by a green box)?\n(A) cabinetry\n(B) vase" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445079_5535326563500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, infant bed (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) infant bed\n(B) toy" }, { "from": "gpt", "value": "(A) infant bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018829_647482571452541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to studio couch (highlighted by a red box)? pillow (highlighted by a blue box) or mat (highlighted by a green box).\n(A) pillow\n(B) mat" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204305_15308270274458_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, table (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) table\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444574_31885806181041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the door (highlighted by a red box)? Choose among these: furniture (highlighted by a blue box) or chair (highlighted by a green box).\n(A) furniture\n(B) chair" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898391_369476418068041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from chest of drawers (highlighted by a red box)? Choose among these: bed (highlighted by a blue box) or cardboard box (highlighted by a green box).\n(A) bed\n(B) cardboard box" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669927_14264966971375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, keyboard (highlighted by a red box) or computer monitor (highlighted by a blue box)?\n(A) keyboard\n(B) computer monitor" }, { "from": "gpt", "value": "(A) keyboard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331089_133736178105375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, storage box (highlighted by a red box) or footwear (highlighted by a blue box)?\n(A) storage box\n(B) footwear" }, { "from": "gpt", "value": "(A) storage box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358386_19246743145208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, mat (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) mat\n(B) pillow" }, { "from": "gpt", "value": "(A) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358289_15923747215958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from chair (highlighted by a red box)? Choose among these: bottle (highlighted by a blue box) or bottle (highlighted by a green box).\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898189_145068429754000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, picture frame (highlighted by a red box) or door (highlighted by a blue box)?\n(A) picture frame\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896249_7561586835083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from screen door (highlighted by a red box), shelf (highlighted by a blue box) or sheet (highlighted by a green box)?\n(A) shelf\n(B) sheet" }, { "from": "gpt", "value": "(B) sheet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649474_14681729585750_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739425_191762302646125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to bath towel (highlighted by a red box)? Choose from mirror (highlighted by a blue box) and soap dispenser (highlighted by a green box).\n(A) mirror\n(B) soap dispenser" }, { "from": "gpt", "value": "(B) soap dispenser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334935_663034887911375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from table (highlighted by a red box)? blanket (highlighted by a blue box) or entertainment center (highlighted by a green box)?\n(A) blanket\n(B) entertainment center" }, { "from": "gpt", "value": "(B) entertainment center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670191_51461032813875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, shelf (highlighted by a red box) or glass box (highlighted by a blue box)?\n(A) shelf\n(B) glass box" }, { "from": "gpt", "value": "(B) glass box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204517_743164025458_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, gas stove (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) gas stove\n(B) appliance" }, { "from": "gpt", "value": "(A) gas stove" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332207_264455073090958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, appliance (highlighted by a red box) or footwear (highlighted by a blue box)?\n(A) appliance\n(B) footwear" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331226_282510317030041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to apple (highlighted by a red box)? Select from ceramic tile (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) ceramic tile\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445169_7811235450041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from window (highlighted by a red box), curtain (highlighted by a blue box) or lamp (highlighted by a green box)?\n(A) curtain\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670048_33438911771583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, toy (highlighted by a red box) or bulletin board (highlighted by a blue box)?\n(A) toy\n(B) bulletin board" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331105_135588973794166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, door (highlighted by a red box) or letter (highlighted by a blue box)?\n(A) door\n(B) letter" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204322_16016059190166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, curtain (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) curtain\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332561_904901068408666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, washing machine (highlighted by a red box) or bath towel (highlighted by a blue box)?\n(A) washing machine\n(B) bath towel" }, { "from": "gpt", "value": "(A) washing machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333319_28431143268791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, shelf (highlighted by a red box) or glass jar (highlighted by a blue box)?\n(A) shelf\n(B) glass jar" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796568_16181681065500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, television (highlighted by a red box) or speaker (highlighted by a blue box)?\n(A) television\n(B) speaker" }, { "from": "gpt", "value": "(B) speaker" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670122_41714875664208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, pillow (highlighted by a red box) or bag (highlighted by a blue box)?\n(A) pillow\n(B) bag" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896162_139835085755458_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from sink (highlighted by a red box)? Choose among these: plant (highlighted by a blue box) or window (highlighted by a green box).\n(A) plant\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444876_99352139117458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, sock (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) sock\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739818_15557648888958_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to toilet paper (highlighted by a red box)? Select from tap (highlighted by a blue box) and sink (highlighted by a green box).\n(A) tap\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896160_139920085470916_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to toiletry (highlighted by a red box), bath towel (highlighted by a blue box) or houseplant (highlighted by a green box)?\n(A) bath towel\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334920_1091100899052874_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, toilet (highlighted by a red box) or bath mat (highlighted by a blue box)?\n(A) toilet\n(B) bath mat" }, { "from": "gpt", "value": "(A) toilet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334025_271626796323916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, electric outlet (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) electric outlet\n(B) curtain" }, { "from": "gpt", "value": "(A) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018079_103486313607000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, paperback book (highlighted by a red box) or cardboard box (highlighted by a blue box)?\n(A) paperback book\n(B) cardboard box" }, { "from": "gpt", "value": "(B) cardboard box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446485_355954353359958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, table lamp (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) table lamp\n(B) pillow" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430739_336564528855416_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the couch (highlighted by a red box)? coffee table (highlighted by a blue box) or box (highlighted by a green box).\n(A) coffee table\n(B) box" }, { "from": "gpt", "value": "(B) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662959_24583488189583_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from furniture (highlighted by a red box)? Select from toilet (highlighted by a blue box) and drawer (highlighted by a green box).\n(A) toilet\n(B) drawer" }, { "from": "gpt", "value": "(B) drawer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445583_283741367004041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, bed (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) bed\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334040_278926918101208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896378_20323350808916_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to curtain (highlighted by a red box)? Choose from chest of drawers (highlighted by a blue box) and electric outlet (highlighted by a green box).\n(A) chest of drawers\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796744_28906070438416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, picture frame (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) picture frame\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333801_51181547853375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from shelf (highlighted by a red box)? book (highlighted by a blue box) or book (highlighted by a green box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458706_136780060908749_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of cabinetry (annotated by the red box) in relation to vent?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445684_61843667793416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, christmas decoration (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) christmas decoration\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115384_1751581216208_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from radiator (highlighted by a red box)? Select from window (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) window\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115201_94442136820166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, screen door (highlighted by a red box) or nightstand (highlighted by a blue box)?\n(A) screen door\n(B) nightstand" }, { "from": "gpt", "value": "(B) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204858_1622824811375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, bottle (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796443_743408668250_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669854_12683450890333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, desktop computer (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) desktop computer\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898621_758036307190291_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to glass door (highlighted by a red box)? Choose from cardboard (highlighted by a blue box) and copy (highlighted by a green box).\n(A) cardboard\n(B) copy" }, { "from": "gpt", "value": "(B) copy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895298_91159129141916_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from chair (highlighted by a red box)? Choose among these: pillow (highlighted by a blue box) or chair (highlighted by a green box).\n(A) pillow\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663397_95078895621083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to window (highlighted by a red box)? Choose from bottle (highlighted by a blue box) and table lamp (highlighted by a green box).\n(A) bottle\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895465_130591212515875_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from kitchen appliance (highlighted by a red box)? Choose among these: plate (highlighted by a blue box) or countertop (highlighted by a green box).\n(A) plate\n(B) countertop" }, { "from": "gpt", "value": "(A) plate" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739686_1023341860708_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, window (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) window\n(B) table lamp" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899899_1026853431970541_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, table lamp (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) table lamp\n(B) pillow" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796505_3406408956500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, window frame (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) window frame\n(B) radiator" }, { "from": "gpt", "value": "(A) window frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358167_60907933992708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, studio couch (highlighted by a red box) or table (highlighted by a blue box)?\n(A) studio couch\n(B) table" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670340_66249893418291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chair (highlighted by a red box) or door (highlighted by a blue box)?\n(A) chair\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898235_695708506305208_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670008_30357591552083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chair (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) chair\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429826_746650800294416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, houseplant (highlighted by a red box) or bath (highlighted by a blue box)?\n(A) houseplant\n(B) bath" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204757_26718407520541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, screen door (highlighted by a red box) or table (highlighted by a blue box)?\n(A) screen door\n(B) table" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115504_12320306269833_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from furniture (highlighted by a red box)? bowling ball (highlighted by a blue box) or bowling ball (highlighted by a green box)?\n(A) bowling ball\n(B) bowling ball" }, { "from": "gpt", "value": "(A) bowling ball" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670271_66586419930082_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the cabinetry (highlighted by a red box)? Choose among these: cabinetry (highlighted by a blue box) or electric outlet (highlighted by a green box).\n(A) cabinetry\n(B) electric outlet" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333828_53337451288833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhere is clothing (annotated by the red box) located in relation to clothing in the image?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332990_125281297656416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of picture frame (annotated by the red box) and picture frame in the image provided, where is picture frame (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899232_880562135901291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, lamp (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) lamp\n(B) picture frame" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332080_251435832865083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, bath mat (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) bath mat\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458548_127520126795250_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to studio couch (highlighted by a red box)? Choose from laundry (highlighted by a blue box) and remote (highlighted by a green box).\n(A) laundry\n(B) remote" }, { "from": "gpt", "value": "(B) remote" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445135_5476532095166_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115412_4226752651666_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, picture frame (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) picture frame\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261203_11578982307750_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, armchair (highlighted by a red box) or armchair (highlighted by a blue box)?\n(A) armchair\n(B) armchair" }, { "from": "gpt", "value": "(B) armchair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429884_367768133156083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to radiator (highlighted by a red box), window sill (highlighted by a blue box) or curtain (highlighted by a green box)?\n(A) window sill\n(B) curtain" }, { "from": "gpt", "value": "(A) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334967_669363385709083_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from door (highlighted by a red box)? corridor (highlighted by a blue box) or desk (highlighted by a green box)?\n(A) corridor\n(B) desk" }, { "from": "gpt", "value": "(B) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670208_54155658078208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, picture frame (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) picture frame\n(B) studio couch" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429739_20042072354250_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to shelf (highlighted by a red box)? Choose from comic book (highlighted by a blue box) and shelf (highlighted by a green box).\n(A) comic book\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447294_408976901505833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, window screen (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) window screen\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018098_367367300422625_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of curtain (annotated by the red box) and curtain in the image provided, where is curtain (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333806_51227945708833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from book (highlighted by a red box)? Choose among these: book (highlighted by a blue box) or book (highlighted by a green box).\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828368_92209625768708_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, cooker (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) cooker\n(B) chair" }, { "from": "gpt", "value": "(A) cooker" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331053_482516014646916_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from shelf (highlighted by a red box)? Choose among these: picture frame (highlighted by a blue box) or electric outlet (highlighted by a green box).\n(A) picture frame\n(B) electric outlet" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333000_128237406350500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, desk (highlighted by a red box) or coffee cup (highlighted by a blue box)?\n(A) desk\n(B) coffee cup" }, { "from": "gpt", "value": "(B) coffee cup" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446450_354649030434083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, desk (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) desk\n(B) radiator" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429884_367824127170666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the round table (highlighted by a red box)? round table (highlighted by a blue box) or lamp (highlighted by a green box).\n(A) round table\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018746_7294754059166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, appliance (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) appliance\n(B) radiator" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895895_109444117247166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, sink (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) sink\n(B) screen door" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897480_470977420373208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, chair (highlighted by a red box) or table (highlighted by a blue box)?\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898785_67323113644916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, bookshelf (highlighted by a red box) or window screen (highlighted by a blue box)?\n(A) bookshelf\n(B) window screen" }, { "from": "gpt", "value": "(B) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333574_207503836736791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to food (highlighted by a red box)? Choose from window (highlighted by a blue box) and heater (highlighted by a green box).\n(A) window\n(B) heater" }, { "from": "gpt", "value": "(B) heater" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334027_273606015297416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, door (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) door\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444762_81587470889708_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, radiator (highlighted by a red box) or heater (highlighted by a blue box)?\n(A) radiator\n(B) heater" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898358_511596579583458_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to studio couch (highlighted by a red box)? Select from window (highlighted by a blue box) and curtain (highlighted by a green box).\n(A) window\n(B) curtain" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796584_17383476806208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, houseplant (highlighted by a red box) or tile (highlighted by a blue box)?\n(A) houseplant\n(B) tile" }, { "from": "gpt", "value": "(B) tile" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649603_35957609531500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from picture frame (highlighted by a red box)? Choose among these: air conditioner (highlighted by a blue box) or electric outlet (highlighted by a green box).\n(A) air conditioner\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018340_117242808817000_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from cabinetry (highlighted by a red box)? Select from shelf (highlighted by a blue box) and toy (highlighted by a green box).\n(A) shelf\n(B) toy" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897523_472478997805291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, bottle (highlighted by a red box) or storage box (highlighted by a blue box)?\n(A) bottle\n(B) storage box" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332397_401450515197333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, studio couch (highlighted by a red box) or glass door (highlighted by a blue box)?\n(A) studio couch\n(B) glass door" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445784_64781353305333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, window (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) window\n(B) houseplant" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332398_401531415595833_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the cabinetry (highlighted by a red box)? Choose among these: cabinetry (highlighted by a blue box) or home appliance (highlighted by a green box).\n(A) cabinetry\n(B) home appliance" }, { "from": "gpt", "value": "(B) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429799_737956727657833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to fireplace (highlighted by a red box)? Select from window (highlighted by a blue box) and curtain (highlighted by a green box).\n(A) window\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828334_79029132891333_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from glass door (highlighted by a red box)? Select from studio couch (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204887_807675671166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from screen door (highlighted by a red box)? appliance (highlighted by a blue box) or home appliance (highlighted by a green box)?\n(A) appliance\n(B) home appliance" }, { "from": "gpt", "value": "(B) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430293_187324248932000_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from chest of drawers (highlighted by a red box)? Choose among these: book (highlighted by a blue box) or book (highlighted by a green box).\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896176_141465832862291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, bottle (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896524_34640729109916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, basket (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) basket\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430402_126560395583791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhere is kitchen appliance (annotated by the red box) located in relation to coffee cup in the image?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332072_249943090423458_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, countertop (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) countertop\n(B) appliance" }, { "from": "gpt", "value": "(A) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739821_16256184181708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, mat (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) mat\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897745_115957765646125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, soap dispenser (highlighted by a red box) or lighting (highlighted by a blue box)?\n(A) soap dispenser\n(B) lighting" }, { "from": "gpt", "value": "(B) lighting" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358117_62326098392958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from sink (highlighted by a red box)? Select from kitchen appliance (highlighted by a blue box) and appliance (highlighted by a green box).\n(A) kitchen appliance\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828334_79065135321291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from table (highlighted by a red box)? Select from table (highlighted by a blue box) and fireplace (highlighted by a green box).\n(A) table\n(B) fireplace" }, { "from": "gpt", "value": "(B) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828593_104106064295208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, book (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) book\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018833_649145962915416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of bed (annotated by the red box) in relation to stairwell? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897712_112141290866416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, bottle (highlighted by a red box) or window (highlighted by a blue box)?\n(A) bottle\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897587_134973348330625_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from doormat (highlighted by a red box)? Choose from chair (highlighted by a blue box) and door (highlighted by a green box).\n(A) chair\n(B) door" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429694_11270096724000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, book (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) book\n(B) shelf" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358731_6715829091333_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from door (highlighted by a red box)? Select from blanket (highlighted by a blue box) and furniture (highlighted by a green box).\n(A) blanket\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333477_60236499021291_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the toothbrush (highlighted by a red box)? refrigerator (highlighted by a blue box) or light switch (highlighted by a green box).\n(A) refrigerator\n(B) light switch" }, { "from": "gpt", "value": "(B) light switch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898903_817206038524208_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898720_582951674920041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, screen door (highlighted by a red box) or light switch (highlighted by a blue box)?\n(A) screen door\n(B) light switch" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358407_40575669181458_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from bottle (highlighted by a red box)? Choose among these: teapot (highlighted by a blue box) or coffee cup (highlighted by a green box).\n(A) teapot\n(B) coffee cup" }, { "from": "gpt", "value": "(A) teapot" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204522_1508777650458_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the picture frame (highlighted by a red box)? picture frame (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261164_751902532000_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from pillow (highlighted by a red box)? Select from magazine (highlighted by a blue box) and studio couch (highlighted by a green box).\n(A) magazine\n(B) studio couch" }, { "from": "gpt", "value": "(A) magazine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204381_18137921363291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, lamp (highlighted by a red box) or board game (highlighted by a blue box)?\n(A) lamp\n(B) board game" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332991_125373693658250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, toy (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) toy\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115573_2628102885375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, box (highlighted by a red box) or box (highlighted by a blue box)?\n(A) box\n(B) box" }, { "from": "gpt", "value": "(B) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204335_15026302652625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, window (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) window\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895653_368635567595166_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from pillow (highlighted by a red box), light switch (highlighted by a blue box) or furniture (highlighted by a green box)?\n(A) light switch\n(B) furniture" }, { "from": "gpt", "value": "(A) light switch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896177_141354743454833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, shop window (highlighted by a red box) or tortoise (highlighted by a blue box)?\n(A) shop window\n(B) tortoise" }, { "from": "gpt", "value": "(A) shop window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895446_129384884778250_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to washing machine (highlighted by a red box)? sink (highlighted by a blue box) or clothing (highlighted by a green box).\n(A) sink\n(B) clothing" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896066_131830987025208_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from cabinetry (highlighted by a red box), food (highlighted by a blue box) or table (highlighted by a green box)?\n(A) food\n(B) table" }, { "from": "gpt", "value": "(A) food" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447294_409038909177958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to appliance (highlighted by a red box)? power outlet (highlighted by a blue box) or toy (highlighted by a green box).\n(A) power outlet\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358645_3219427341000_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to cabinetry (highlighted by a red box)? Select from kitchen appliance (highlighted by a blue box) and paper towel (highlighted by a green box).\n(A) kitchen appliance\n(B) paper towel" }, { "from": "gpt", "value": "(A) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739846_17120425703083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of curtain (annotated by the red box) in relation to window? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446445_354370527629166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332469_886509269420083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to studio couch (highlighted by a red box), door (highlighted by a blue box) or cabinetry (highlighted by a green box)?\n(A) door\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898448_3300378952666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, window (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) window\n(B) toiletry" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796709_27465086119416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chair (highlighted by a red box) or window (highlighted by a blue box)?\n(A) chair\n(B) window" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895626_470702035120000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, pipe (highlighted by a red box) or pipe (highlighted by a blue box)?\n(A) pipe\n(B) pipe" }, { "from": "gpt", "value": "(B) pipe" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115132_85615042836625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from porcelain (highlighted by a red box)? Choose among these: toilet bowl (highlighted by a blue box) or sink (highlighted by a green box).\n(A) toilet bowl\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895826_1219989676288083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from screen door (highlighted by a red box)? curtain (highlighted by a blue box) or counter top (highlighted by a green box)?\n(A) curtain\n(B) counter top" }, { "from": "gpt", "value": "(B) counter top" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896429_19292548889708_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333168_44176968112500_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, desk (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) desk\n(B) cabinetry" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895865_107715064016583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to mat (highlighted by a red box)? Select from mirror (highlighted by a blue box) and chair (highlighted by a green box).\n(A) mirror\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018608_633212506004708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from drawer (highlighted by a red box)? Select from chair (highlighted by a blue box) and bottle (highlighted by a green box).\n(A) chair\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897798_131206109195125_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to cabinetry (highlighted by a red box), cabinetry (highlighted by a blue box) or appliance (highlighted by a green box)?\n(A) cabinetry\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898899_816946744611583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, kitchen appliance (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) kitchen appliance\n(B) basket" }, { "from": "gpt", "value": "(B) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333325_29581419736541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, nightstand (highlighted by a red box) or tablecloth (highlighted by a blue box)?\n(A) nightstand\n(B) tablecloth" }, { "from": "gpt", "value": "(A) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444748_79560067222875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, electric outlet (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) electric outlet\n(B) bottle" }, { "from": "gpt", "value": "(A) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898695_581129986885583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from mat (highlighted by a red box)? desk (highlighted by a blue box) or coffee table (highlighted by a green box)?\n(A) desk\n(B) coffee table" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899975_814670365000_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from picture frame (highlighted by a red box)? Choose among these: bookcase (highlighted by a blue box) or book (highlighted by a green box).\n(A) bookcase\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670028_32354502250083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, desk (highlighted by a red box) or food (highlighted by a blue box)?\n(A) desk\n(B) food" }, { "from": "gpt", "value": "(B) food" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333673_134089761287625_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, clothing (highlighted by a red box) or clothing (highlighted by a blue box)?\n(A) clothing\n(B) clothing" }, { "from": "gpt", "value": "(A) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895491_450896056189375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chair (highlighted by a red box) or desk (highlighted by a blue box)?\n(A) chair\n(B) desk" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333264_21807810463833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, bottle (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) bottle\n(B) cabinetry" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334733_535837423666958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, throw pillow (highlighted by a red box) or dog bed (highlighted by a blue box)?\n(A) throw pillow\n(B) dog bed" }, { "from": "gpt", "value": "(A) throw pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739850_17221717024916_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from curtain (highlighted by a red box)? table lamp (highlighted by a blue box) or chest of drawers (highlighted by a green box)?\n(A) table lamp\n(B) chest of drawers" }, { "from": "gpt", "value": "(B) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334040_278879020919749_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, cabinetry (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) cabinetry\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649798_46128514432208_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895910_110849432458291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, nightstand (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) nightstand\n(B) pillow" }, { "from": "gpt", "value": "(A) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332482_338662302172041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, furniture (highlighted by a red box) or turquoise (highlighted by a blue box)?\n(A) furniture\n(B) turquoise" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446444_82573007951291_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from fireplace (highlighted by a red box)? Choose among these: star (highlighted by a blue box) or appliance (highlighted by a green box).\n(A) star\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796237_2990226716041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, chest of drawers (highlighted by a red box) or medicine cabinet (highlighted by a blue box)?\n(A) chest of drawers\n(B) medicine cabinet" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828328_77676568188041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is curtain (annotated by the red box) located relative to curtain?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445684_61867657785250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, toy (highlighted by a red box) or coffee table (highlighted by a blue box)?\n(A) toy\n(B) coffee table" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333277_24478504253416_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to window (highlighted by a red box)? Select from couch (highlighted by a blue box) and drawer (highlighted by a green box).\n(A) couch\n(B) drawer" }, { "from": "gpt", "value": "(A) couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796721_27379886489208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, cabinetry (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) cabinetry\n(B) screen door" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897757_117737222241083_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to art (highlighted by a red box)? Select from picture frame (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430855_74288388121916_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to table lamp (highlighted by a red box)? screen door (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) screen door\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897890_344989513881958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332232_755605034859166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, mirror (highlighted by a red box) or exhaust hood (highlighted by a blue box)?\n(A) mirror\n(B) exhaust hood" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429739_20155459406625_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, toy (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898006_219507936524000_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to soap dispenser (highlighted by a red box), mirror (highlighted by a blue box) or toilet (highlighted by a green box)?\n(A) mirror\n(B) toilet" }, { "from": "gpt", "value": "(B) toilet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358253_6245043176791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, studio couch (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) studio couch\n(B) table lamp" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333851_74768925817625_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from swivel chair (highlighted by a red box)? Choose among these: mat (highlighted by a blue box) or ipad (highlighted by a green box).\n(A) mat\n(B) ipad" }, { "from": "gpt", "value": "(B) ipad" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898596_184403780241375_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from clipboard (highlighted by a red box)? Choose from coffee machine (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) coffee machine\n(B) cabinetry" }, { "from": "gpt", "value": "(A) coffee machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430388_125139298314000_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from radiator (highlighted by a red box)? Choose from houseplant (highlighted by a blue box) and table (highlighted by a green box).\n(A) houseplant\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897633_139639855212416_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from door (highlighted by a red box), screen door (highlighted by a blue box) or chest of drawers (highlighted by a green box)?\n(A) screen door\n(B) chest of drawers" }, { "from": "gpt", "value": "(B) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670350_67458582929375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, glass door (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) glass door\n(B) curtain" }, { "from": "gpt", "value": "(A) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333806_51350445985666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, book (highlighted by a red box) or cabinet (highlighted by a blue box)?\n(A) book\n(B) cabinet" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204275_12628470720458_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to faucet (highlighted by a red box), window (highlighted by a blue box) or sink (highlighted by a green box)?\n(A) window\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332184_262602621923375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from infant bed (highlighted by a red box)? Choose among these: linen (highlighted by a blue box) or luggage (highlighted by a green box).\n(A) linen\n(B) luggage" }, { "from": "gpt", "value": "(B) luggage" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895587_1160137036796833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, picture frame (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) picture frame\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430809_64094599905458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, table (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) table\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796191_482725188291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is nightstand (annotated by the red box) located relative to clock? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445955_129962240271291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of studio couch (annotated by the red box) and table in the image provided, where is studio couch (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895587_1160170439916583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from pillow (highlighted by a red box)? houseplant (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) houseplant\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204481_24846681261833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, cabinetry (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) cabinetry\n(B) window sill" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796579_16776177820624_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to fireplace (highlighted by a red box)? mirror (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) mirror\n(B) cabinetry" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429720_18078648598875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from paper towel (highlighted by a red box), cabinetry (highlighted by a blue box) or glass jar (highlighted by a green box)?\n(A) cabinetry\n(B) glass jar" }, { "from": "gpt", "value": "(B) glass jar" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898203_145841378198375_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from chair (highlighted by a red box)? Choose among these: chair (highlighted by a blue box) or table lamp (highlighted by a green box).\n(A) chair\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333847_75034218381500_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from pillow (highlighted by a red box)? pillow (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899574_959630333123666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to oven (highlighted by a red box), drawer (highlighted by a blue box) or glass door (highlighted by a green box)?\n(A) drawer\n(B) glass door" }, { "from": "gpt", "value": "(A) drawer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828307_76288738513166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, door (highlighted by a red box) or window (highlighted by a blue box)?\n(A) door\n(B) window" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445834_68177692312000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, candle holder (highlighted by a red box) or robe (highlighted by a blue box)?\n(A) candle holder\n(B) robe" }, { "from": "gpt", "value": "(A) candle holder" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333657_130183772992583_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445721_63593903895916_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358645_3262226287625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from mug (highlighted by a red box)? Choose among these: scissors (highlighted by a blue box) or appliance (highlighted by a green box).\n(A) scissors\n(B) appliance" }, { "from": "gpt", "value": "(A) scissors" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430248_182379280824750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, shelf (highlighted by a red box) or paperback book (highlighted by a blue box)?\n(A) shelf\n(B) paperback book" }, { "from": "gpt", "value": "(B) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445169_7815233844958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, rope (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) rope\n(B) radiator" }, { "from": "gpt", "value": "(A) rope" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332774_44415348380916_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895653_368635567595166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, light switch (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) light switch\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458688_9225489062125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, couch (highlighted by a red box) or glass plate (highlighted by a blue box)?\n(A) couch\n(B) glass plate" }, { "from": "gpt", "value": "(A) couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018608_633226516936833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chair (highlighted by a red box) or coffee table (highlighted by a blue box)?\n(A) chair\n(B) coffee table" }, { "from": "gpt", "value": "(B) coffee table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898710_581488813341333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, door (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) door\n(B) curtain" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897776_128876228100666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, door (highlighted by a red box) or light (highlighted by a blue box)?\n(A) door\n(B) light" }, { "from": "gpt", "value": "(B) light" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430221_180239404547041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to cabinetry (highlighted by a red box)? Select from screen door (highlighted by a blue box) and door (highlighted by a green box).\n(A) screen door\n(B) door" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204449_23032980583875_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from window sill (highlighted by a red box)? radiator (highlighted by a blue box) or speaker (highlighted by a green box)?\n(A) radiator\n(B) speaker" }, { "from": "gpt", "value": "(B) speaker" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445938_79466560869708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from radiator (highlighted by a red box)? cabinetry (highlighted by a blue box) or debris (highlighted by a green box)?\n(A) cabinetry\n(B) debris" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899563_958919722930125_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from studio couch (highlighted by a red box)? Select from studio couch (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898696_580853684266375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, cabinetry (highlighted by a red box) or trash bin/can (highlighted by a blue box)?\n(A) cabinetry\n(B) trash bin/can" }, { "from": "gpt", "value": "(B) trash bin/can" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333168_44156876253333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from sink (highlighted by a red box)? kettle (highlighted by a blue box) or appliance (highlighted by a green box)?\n(A) kettle\n(B) appliance" }, { "from": "gpt", "value": "(A) kettle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333873_76307371111166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, door (highlighted by a red box) or wide (highlighted by a blue box)?\n(A) door\n(B) wide" }, { "from": "gpt", "value": "(B) wide" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899653_233586478108208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, letter (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) letter\n(B) furniture" }, { "from": "gpt", "value": "(A) letter" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018404_393256886133291_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from cleaning product (highlighted by a red box), cleaning product (highlighted by a blue box) or cleaning product (highlighted by a green box)?\n(A) cleaning product\n(B) cleaning product" }, { "from": "gpt", "value": "(A) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447210_209230773098291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to furniture (highlighted by a red box), bottle (highlighted by a blue box) or bottle (highlighted by a green box)?\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896117_146003621598166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, shelf (highlighted by a red box) or person (highlighted by a blue box)?\n(A) shelf\n(B) person" }, { "from": "gpt", "value": "(B) person" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331277_13226440835041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, book (highlighted by a red box) or paperback book (highlighted by a blue box)?\n(A) book\n(B) paperback book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447216_212511024426416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from desk (highlighted by a red box)? Select from table (highlighted by a blue box) and cloth (highlighted by a green box).\n(A) table\n(B) cloth" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444735_77903103414375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, book (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) book\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334672_391412103077166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, beverage (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) beverage\n(B) toilet paper" }, { "from": "gpt", "value": "(A) beverage" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333277_24413814097791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to chair (highlighted by a red box)? Select from chair (highlighted by a blue box) and flower (highlighted by a green box).\n(A) chair\n(B) flower" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896229_5022499093791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to sink (highlighted by a red box)? Choose from toiletry (highlighted by a blue box) and mouthwash (highlighted by a green box).\n(A) toiletry\n(B) mouthwash" }, { "from": "gpt", "value": "(A) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896494_31435949349083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the bay window (highlighted by a red box)? air conditioning (highlighted by a blue box) or window (highlighted by a green box).\n(A) air conditioning\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896527_34742920090665_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from gift basket (highlighted by a red box)? bowl (highlighted by a blue box) or basket (highlighted by a green box)?\n(A) bowl\n(B) basket" }, { "from": "gpt", "value": "(A) bowl" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358410_40642674788333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from lamp (highlighted by a red box)? Choose among these: stationery (highlighted by a blue box) or stationery (highlighted by a green box).\n(A) stationery\n(B) stationery" }, { "from": "gpt", "value": "(A) stationery" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896411_16596317534916_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from cabinetry (highlighted by a red box)? oven (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) oven\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115216_95013236959125_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to houseplant (highlighted by a red box)? cabinetry (highlighted by a blue box) or window (highlighted by a green box).\n(A) cabinetry\n(B) window" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333003_128371002449500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, table (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445758_65483441005916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, screen door (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) screen door\n(B) screen door" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018894_655063588691833_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429884_367830124742000_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897757_117749217265875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chair (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) chair\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662884_16507791528999_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the candle holder (highlighted by a red box)? picture frame (highlighted by a blue box) or animal (highlighted by a green box).\n(A) picture frame\n(B) animal" }, { "from": "gpt", "value": "(B) animal" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115161_88094076946291_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to screen door (highlighted by a red box), light (highlighted by a blue box) or light (highlighted by a green box)?\n(A) light\n(B) light" }, { "from": "gpt", "value": "(B) light" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331128_174115948636666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of floral arrangement (annotated by the red box) in reference to curtain? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333014_130233108065500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, poster (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) poster\n(B) picture frame" }, { "from": "gpt", "value": "(A) poster" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358324_18839683138291_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to stairs (highlighted by a red box), glass window (highlighted by a blue box) or screen door (highlighted by a green box)?\n(A) glass window\n(B) screen door" }, { "from": "gpt", "value": "(A) glass window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115127_84780940887166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to power outlet (highlighted by a red box)? Choose from studio couch (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333674_134203764920875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, fabric (highlighted by a red box) or book (highlighted by a blue box)?\n(A) fabric\n(B) book" }, { "from": "gpt", "value": "(A) fabric" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662882_16755493518958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, screen door (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) screen door\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358121_62443083316333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from window (highlighted by a red box)? Choose among these: flower (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) flower\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669878_10508343858208_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to vase (highlighted by a red box)? Select from shelf (highlighted by a blue box) and vase (highlighted by a green box).\n(A) shelf\n(B) vase" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48017998_458304223393500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of cupboard (annotated by the red box) and radiator in the image provided, where is cupboard (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334052_85570539631916_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to clothing (highlighted by a red box)? Choose from oven (highlighted by a blue box) and clothing (highlighted by a green box).\n(A) oven\n(B) clothing" }, { "from": "gpt", "value": "(B) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896020_138421585634333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, mirror (highlighted by a red box) or medicine cabinet (highlighted by a blue box)?\n(A) mirror\n(B) medicine cabinet" }, { "from": "gpt", "value": "(B) medicine cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334967_669327383624375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, coffee table (highlighted by a red box) or table (highlighted by a blue box)?\n(A) coffee table\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445198_10953026816291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of furniture (annotated by the red box) in relation to studio couch?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896591_32873730247207_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, machine (highlighted by a red box) or sink (highlighted by a blue box)?\n(A) machine\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444883_102369997181291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, electric outlet (highlighted by a red box) or door (highlighted by a blue box)?\n(A) electric outlet\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429752_355446986381000_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from houseplant (highlighted by a red box)? Choose from window sill (highlighted by a blue box) and paperback book (highlighted by a green box).\n(A) window sill\n(B) paperback book" }, { "from": "gpt", "value": "(B) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358362_16156158978250_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from chair (highlighted by a red box)? Choose among these: wide (highlighted by a blue box) or window screen (highlighted by a green box).\n(A) wide\n(B) window screen" }, { "from": "gpt", "value": "(B) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895936_107869526584583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the bed (highlighted by a red box)? book (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) book\n(B) picture frame" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445592_284400843681083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to door (highlighted by a red box), light switch (highlighted by a blue box) or door (highlighted by a green box)?\n(A) light switch\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445769_64501883635833_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from curtain (highlighted by a red box)? file cabinet (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) file cabinet\n(B) pillow" }, { "from": "gpt", "value": "(A) file cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332792_47334294336125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of television (annotated by the red box) in reference to game controller?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739716_3182776861791_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the appliance (highlighted by a red box)? Choose among these: microwave oven (highlighted by a blue box) or cardboard box (highlighted by a green box).\n(A) microwave oven\n(B) cardboard box" }, { "from": "gpt", "value": "(B) cardboard box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444755_80879665866208_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears farthest from the camera in this image?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447294_408900199887250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, shelf (highlighted by a red box) or table (highlighted by a blue box)?\n(A) shelf\n(B) table" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897948_351355912112083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from plant (highlighted by a red box), window (highlighted by a blue box) or table (highlighted by a green box)?\n(A) window\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649612_36534423858750_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from bedside lamp (highlighted by a red box)? nightstand (highlighted by a blue box) or lamp (highlighted by a green box)?\n(A) nightstand\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896545_30100500965791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, table lamp (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) table lamp\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896074_132800108874083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to cabinet (highlighted by a red box)? basket (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) basket\n(B) pillow" }, { "from": "gpt", "value": "(A) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334789_428243279619750_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446488_356735848354666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the bowl (highlighted by a red box)? Choose among these: counter top (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) counter top\n(B) cabinetry" }, { "from": "gpt", "value": "(A) counter top" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47431120_348920033016916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to cabinetry (highlighted by a red box)? Select from appliance (highlighted by a blue box) and gas stove (highlighted by a green box).\n(A) appliance\n(B) gas stove" }, { "from": "gpt", "value": "(B) gas stove" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670233_52884075692708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of mirror (annotated by the red box) in reference to towel bar? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333135_39306279520000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, houseplant (highlighted by a red box) or doormat (highlighted by a blue box)?\n(A) houseplant\n(B) doormat" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115358_4171805542291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to picture frame (highlighted by a red box)? Select from window (highlighted by a blue box) and houseplant (highlighted by a green box).\n(A) window\n(B) houseplant" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896009_137246262918208_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to lamp (highlighted by a red box)? picture frame (highlighted by a blue box) or chair (highlighted by a green box).\n(A) picture frame\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334066_87476111521833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the screen door (highlighted by a red box)? Choose among these: towel (highlighted by a blue box) or towel (highlighted by a green box).\n(A) towel\n(B) towel" }, { "from": "gpt", "value": "(A) towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739739_3928192902375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, picture frame (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) picture frame\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261556_75566872746333_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to cabinetry (highlighted by a red box)? Select from postcard (highlighted by a blue box) and bulletin board (highlighted by a green box).\n(A) postcard\n(B) bulletin board" }, { "from": "gpt", "value": "(B) bulletin board" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430814_65797681886958_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from chair (highlighted by a red box)? Select from table (highlighted by a blue box) and chair (highlighted by a green box).\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898477_157324705943125_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828449_91323235483291_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to door (highlighted by a red box)? umbrella (highlighted by a blue box) or radiator (highlighted by a green box).\n(A) umbrella\n(B) radiator" }, { "from": "gpt", "value": "(A) umbrella" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430310_264976241217457_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the picture frame (highlighted by a red box)? Choose among these: shelf (highlighted by a blue box) or platter (highlighted by a green box).\n(A) shelf\n(B) platter" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333657_130112468580375_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the storage box (highlighted by a red box)? Choose among these: ball (highlighted by a blue box) or storage box (highlighted by a green box).\n(A) ball\n(B) storage box" }, { "from": "gpt", "value": "(A) ball" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899577_959511031919916_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from concrete (highlighted by a red box)? cabinetry (highlighted by a blue box) or appliance (highlighted by a green box)?\n(A) cabinetry\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670133_40029871972250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, door (highlighted by a red box) or exhaust hood (highlighted by a blue box)?\n(A) door\n(B) exhaust hood" }, { "from": "gpt", "value": "(B) exhaust hood" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670224_53951159838625_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, picture frame (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) picture frame\n(B) chair" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115265_115093264293041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018341_117152112146500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is lamp (annotated by the red box) located relative to curtain? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334869_620760821851375_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to tableware (highlighted by a red box)? sink (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) sink\n(B) cabinetry" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662874_14475280647375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, door (highlighted by a red box) or plain (highlighted by a blue box)?\n(A) door\n(B) plain" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429826_746684886532416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, sink (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) sink\n(B) toiletry" }, { "from": "gpt", "value": "(B) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115158_87682491256958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, window screen (highlighted by a red box) or toilet bowl (highlighted by a blue box)?\n(A) window screen\n(B) toilet bowl" }, { "from": "gpt", "value": "(A) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018844_649821319248666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of glass door (annotated by the red box) in reference to glass door?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429870_14371986922125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, toy (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898350_511429081892375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from electric outlet (highlighted by a red box)? Choose among these: bottle (highlighted by a blue box) or faucet (highlighted by a green box).\n(A) bottle\n(B) faucet" }, { "from": "gpt", "value": "(B) faucet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115448_11738250224541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47330990_177109093509500_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from chair (highlighted by a red box), chair (highlighted by a blue box) or table (highlighted by a green box)?\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334464_100923291788125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, table (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446466_355392449627000_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from chair (highlighted by a red box)? Select from toy (highlighted by a blue box) and desk (highlighted by a green box).\n(A) toy\n(B) desk" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018473_527775995092958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, toy (highlighted by a red box) or tablet computer (highlighted by a blue box)?\n(A) toy\n(B) tablet computer" }, { "from": "gpt", "value": "(B) tablet computer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663401_95126293549333_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, chair (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) chair\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47330996_177035990069041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, shelf (highlighted by a red box) or plant (highlighted by a blue box)?\n(A) shelf\n(B) plant" }, { "from": "gpt", "value": "(B) plant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897467_471421819572875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, picture frame (highlighted by a red box) or table (highlighted by a blue box)?\n(A) picture frame\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332710_109966611491375_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429764_358188148192083_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to shower (highlighted by a red box)? shower door (highlighted by a blue box) or towel (highlighted by a green box).\n(A) shower door\n(B) towel" }, { "from": "gpt", "value": "(A) shower door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649408_10094389504916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, coffee table (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) coffee table\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897462_470094060238291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, stool (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) stool\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896308_6692642496041_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429799_737874527574458_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, table (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) table\n(B) cabinetry" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446488_356848152295958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from furniture (highlighted by a red box)? Choose among these: shelf (highlighted by a blue box) or crate (highlighted by a green box).\n(A) shelf\n(B) crate" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669881_10970905822583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from picture frame (highlighted by a red box)? picture frame (highlighted by a blue box) or door (highlighted by a green box)?\n(A) picture frame\n(B) door" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429804_737655832480541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, screen door (highlighted by a red box) or thermostat (highlighted by a blue box)?\n(A) screen door\n(B) thermostat" }, { "from": "gpt", "value": "(B) thermostat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670158_40782140754541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to bottle (highlighted by a red box)? picture frame (highlighted by a blue box) or toaster (highlighted by a green box).\n(A) picture frame\n(B) toaster" }, { "from": "gpt", "value": "(B) toaster" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649384_11091200719791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from cardboard box (highlighted by a red box)? chair (highlighted by a blue box) or bookcase (highlighted by a green box)?\n(A) chair\n(B) bookcase" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895967_406897001275041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, toy (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) toy\n(B) pillow" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48017888_79807503422416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to bed (highlighted by a red box), picture frame (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896556_30871832006916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, toilet paper (highlighted by a red box) or mirror (highlighted by a blue box)?\n(A) toilet paper\n(B) mirror" }, { "from": "gpt", "value": "(A) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358291_15750652519708_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333292_26359541008041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to toothbrush (highlighted by a red box)? Select from houseplant (highlighted by a blue box) and bottle (highlighted by a green box).\n(A) houseplant\n(B) bottle" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018790_17781557049083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, clothing (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) clothing\n(B) radiator" }, { "from": "gpt", "value": "(A) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430452_1995837538333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, floral arrangement (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) floral arrangement\n(B) toy" }, { "from": "gpt", "value": "(A) floral arrangement" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896411_16606313542666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, window screen (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) window screen\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331187_278109201141375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to toiletry (highlighted by a red box)? bath towel (highlighted by a blue box) or toy (highlighted by a green box).\n(A) bath towel\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739414_191363559569875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, door (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) door\n(B) radiator" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649634_39419943972958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from appliance (highlighted by a red box)? appliance (highlighted by a blue box) or appliance (highlighted by a green box)?\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334205_103844166669458_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, table (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) table\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333493_62618602703375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from bouquet (highlighted by a red box)? Choose among these: notepad (highlighted by a blue box) or coffee cup (highlighted by a green box).\n(A) notepad\n(B) coffee cup" }, { "from": "gpt", "value": "(A) notepad" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896196_142331642126041_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to pillow (highlighted by a red box)? Choose from nightstand (highlighted by a blue box) and window screen (highlighted by a green box).\n(A) nightstand\n(B) window screen" }, { "from": "gpt", "value": "(A) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333862_75528746879625_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018545_828977778954500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, sink (highlighted by a red box) or tap (highlighted by a blue box)?\n(A) sink\n(B) tap" }, { "from": "gpt", "value": "(B) tap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897631_139524468539000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, door (highlighted by a red box) or table (highlighted by a blue box)?\n(A) door\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260872_7289555409208_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to appliance (highlighted by a red box)? Choose from dresser (highlighted by a blue box) and countertop (highlighted by a green box).\n(A) dresser\n(B) countertop" }, { "from": "gpt", "value": "(B) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204305_15316266941208_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358645_3197236527375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chair (highlighted by a red box) or door (highlighted by a blue box)?\n(A) chair\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332812_48057932014666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from dresser (highlighted by a red box)? chair (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331607_18506402725666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the toiletry (highlighted by a red box)? toiletry (highlighted by a blue box) or bottle (highlighted by a green box).\n(A) toiletry\n(B) bottle" }, { "from": "gpt", "value": "(A) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334801_429238399311958_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897480_470935121130750_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, table (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) table\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331423_544275117215291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, furniture (highlighted by a red box) or bean bag chair (highlighted by a blue box)?\n(A) furniture\n(B) bean bag chair" }, { "from": "gpt", "value": "(B) bean bag chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670109_41023803807833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, curtain (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) curtain\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446495_357716539589333_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, shelf (highlighted by a red box) or shower (highlighted by a blue box)?\n(A) shelf\n(B) shower" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430795_60894067702916_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204726_23605919317166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to pillow (highlighted by a red box), side table (highlighted by a blue box) or mat (highlighted by a green box)?\n(A) side table\n(B) mat" }, { "from": "gpt", "value": "(A) side table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334624_385758525939625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to counter top (highlighted by a red box)? cabinetry (highlighted by a blue box) or home appliance (highlighted by a green box).\n(A) cabinetry\n(B) home appliance" }, { "from": "gpt", "value": "(B) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261326_23456286334541_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, book (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) book\n(B) shelf" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333562_200710368336291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, sink (highlighted by a red box) or bath (highlighted by a blue box)?\n(A) sink\n(B) bath" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828596_104249357591125_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from bookcase (highlighted by a red box)? Choose from book (highlighted by a blue box) and book (highlighted by a green box).\n(A) book\n(B) book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828507_102525363471208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649590_35418722705833_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to cabinetry (highlighted by a red box)? Choose from basket (highlighted by a blue box) and kitchen appliance (highlighted by a green box).\n(A) basket\n(B) kitchen appliance" }, { "from": "gpt", "value": "(B) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333840_54051570452041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhere is table (annotated by the red box) located in relation to furniture in the image?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358176_62255642641458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446025_134727308793083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the teddy bear (highlighted by a red box)? toy (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) toy\n(B) picture frame" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670075_38565518232458_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the clock (highlighted by a red box)? Choose among these: picture frame (highlighted by a blue box) or door (highlighted by a green box).\n(A) picture frame\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429886_367934632403375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, plant (highlighted by a red box) or table (highlighted by a blue box)?\n(A) plant\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018063_718836232919000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from light fixture (highlighted by a red box)? Choose from screen door (highlighted by a blue box) and light fixture (highlighted by a green box).\n(A) screen door\n(B) light fixture" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898571_183813099484083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the christmas tree (highlighted by a red box)? gift box (highlighted by a blue box) or window (highlighted by a green box).\n(A) gift box\n(B) window" }, { "from": "gpt", "value": "(A) gift box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898621_757990809307375_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to cleaning product (highlighted by a red box)? lighting (highlighted by a blue box) or cleaning product (highlighted by a green box).\n(A) lighting\n(B) cleaning product" }, { "from": "gpt", "value": "(B) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669959_27818896878625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, cabinetry (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) cabinetry\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896031_129175832905583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chair (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) chair\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358278_8988922690916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, picture frame (highlighted by a red box) or door (highlighted by a blue box)?\n(A) picture frame\n(B) door" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896066_131881000588958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the tile (highlighted by a red box)? Choose among these: table (highlighted by a blue box) or door (highlighted by a green box).\n(A) table\n(B) door" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261313_22335848872500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, remote (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) remote\n(B) pillow" }, { "from": "gpt", "value": "(A) remote" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358167_60901936366291_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to table (highlighted by a red box)? Choose from studio couch (highlighted by a blue box) and man (highlighted by a green box).\n(A) studio couch\n(B) man" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662959_24567494515208_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446462_354134324025208_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from clothing (highlighted by a red box)? Choose from closet (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) closet\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895896_109594421694958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the screen door (highlighted by a red box)? Choose among these: door (highlighted by a blue box) or towel bar (highlighted by a green box).\n(A) door\n(B) towel bar" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458569_154085106375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, radiator (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) radiator\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333840_54055568826916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, houseplant (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) houseplant\n(B) toy" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331283_14092292834083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, shelf (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) shelf\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333239_32236474144708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to table (highlighted by a red box)? shelf (highlighted by a blue box) or computer monitor (highlighted by a green box).\n(A) shelf\n(B) computer monitor" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649775_43382303095541_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from window screen (highlighted by a red box)? Select from studio couch (highlighted by a blue box) and window (highlighted by a green box).\n(A) studio couch\n(B) window" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430439_996658545916_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to bottle (highlighted by a red box), bottle (highlighted by a blue box) or bottle (highlighted by a green box)?\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204390_23030780492375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, drawer (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) drawer\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896365_19947845550958_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333319_28499148697583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the plywood (highlighted by a red box)? chair (highlighted by a blue box) or notebook (highlighted by a green box).\n(A) chair\n(B) notebook" }, { "from": "gpt", "value": "(B) notebook" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739315_44735911731000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, window (highlighted by a red box) or table (highlighted by a blue box)?\n(A) window\n(B) table" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333104_108762294404625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of shelf (annotated by the red box) in reference to lamp? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896362_19788744819208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, stool (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) stool\n(B) screen door" }, { "from": "gpt", "value": "(A) stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334652_389672635358666_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332026_202797502978375_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663332_77493163572083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of chair (annotated by the red box) in relation to chair? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334756_421284514269375_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from couch (highlighted by a red box)? Select from pillow (highlighted by a blue box) and studio couch (highlighted by a green box).\n(A) pillow\n(B) studio couch" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333523_50259988414458_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429762_356823962350583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to equipment (highlighted by a red box), chair (highlighted by a blue box) or houseplant (highlighted by a green box)?\n(A) chair\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018399_392887189660541_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739828_16188378925166_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from couch (highlighted by a red box)? floral arrangement (highlighted by a blue box) or table (highlighted by a green box)?\n(A) floral arrangement\n(B) table" }, { "from": "gpt", "value": "(A) floral arrangement" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332072_249965081531125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, fridge (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) fridge\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430608_315185529048083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the book (highlighted by a red box)? glass jar (highlighted by a blue box) or glass jar (highlighted by a green box).\n(A) glass jar\n(B) glass jar" }, { "from": "gpt", "value": "(A) glass jar" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430288_186702967797041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of door (annotated by the red box) and sheet in the image provided, where is door (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899642_231959294908750_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to material (highlighted by a red box)? Choose from bed (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) bed\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896122_145800122651541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from picture frame (highlighted by a red box)? Select from furniture (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) furniture\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896545_30088505717041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, nightstand (highlighted by a red box) or window (highlighted by a blue box)?\n(A) nightstand\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444913_220344282383875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, sink (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) sink\n(B) screen door" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649421_10682409200666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to cabinetry (highlighted by a red box)? cabinetry (highlighted by a blue box) or table (highlighted by a green box).\n(A) cabinetry\n(B) table" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261251_12623505999625_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from studio couch (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739925_16382068289666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to mouthwash (highlighted by a red box)? toilet paper (highlighted by a blue box) or nightstand (highlighted by a green box).\n(A) toilet paper\n(B) nightstand" }, { "from": "gpt", "value": "(B) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649603_36091603881000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the bowl (highlighted by a red box)? chair (highlighted by a blue box) or chair (highlighted by a green box).\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204585_582618791750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, home appliance (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) home appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(A) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358263_7199862973083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is appliance (annotated by the red box) located relative to cabinetry?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334643_388984572802958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from nightstand (highlighted by a red box)? Choose from bed (highlighted by a blue box) and lamp (highlighted by a green box).\n(A) bed\n(B) lamp" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899003_640650927696041_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446485_355844348409833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, studio couch (highlighted by a red box) or coffee cup (highlighted by a blue box)?\n(A) studio couch\n(B) coffee cup" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444908_106388650984791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to microwave oven (highlighted by a red box)? Select from counter top (highlighted by a blue box) and kitchen appliance (highlighted by a green box).\n(A) counter top\n(B) kitchen appliance" }, { "from": "gpt", "value": "(B) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649707_47653750754541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, cabinetry (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) cabinetry\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334040_278912207422458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, studio couch (highlighted by a red box) or remote (highlighted by a blue box)?\n(A) studio couch\n(B) remote" }, { "from": "gpt", "value": "(B) remote" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018832_649332753918916_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from computer monitor (highlighted by a red box), storage box (highlighted by a blue box) or shelf (highlighted by a green box)?\n(A) storage box\n(B) shelf" }, { "from": "gpt", "value": "(A) storage box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332585_360717139676375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, houseplant (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) houseplant\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649440_12675546982958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, countertop (highlighted by a red box) or step stool (highlighted by a blue box)?\n(A) countertop\n(B) step stool" }, { "from": "gpt", "value": "(B) step stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895571_1153716442672208_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from door (highlighted by a red box)? picture frame (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334207_103224790519708_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, window (highlighted by a red box) or fridge (highlighted by a blue box)?\n(A) window\n(B) fridge" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115573_2628102885375_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the box (highlighted by a red box)? Choose among these: box (highlighted by a blue box) or garbage (highlighted by a green box).\n(A) box\n(B) garbage" }, { "from": "gpt", "value": "(A) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458282_76349437495375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, door (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) door\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662962_24680399858666_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896416_17793028231083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, swivel chair (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) swivel chair\n(B) window sill" }, { "from": "gpt", "value": "(A) swivel chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898621_758038306364000_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the toiletry (highlighted by a red box)? bath mat (highlighted by a blue box) or toiletry (highlighted by a green box).\n(A) bath mat\n(B) toiletry" }, { "from": "gpt", "value": "(B) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739635_2316158027791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the tap (highlighted by a red box)? Choose among these: sink (highlighted by a blue box) or tap (highlighted by a green box).\n(A) sink\n(B) tap" }, { "from": "gpt", "value": "(B) tap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358253_6179052624583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from christmas tree (highlighted by a red box)? Choose from pad (highlighted by a blue box) and box (highlighted by a green box).\n(A) pad\n(B) box" }, { "from": "gpt", "value": "(A) pad" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446498_357588825206875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the towel (highlighted by a red box)? Choose among these: shower door (highlighted by a blue box) or toiletry (highlighted by a green box).\n(A) shower door\n(B) toiletry" }, { "from": "gpt", "value": "(A) shower door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358234_9884766061750_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, screen door (highlighted by a red box) or bed (highlighted by a blue box)?\n(A) screen door\n(B) bed" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430441_812249760375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, door (highlighted by a red box) or book (highlighted by a blue box)?\n(A) door\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261323_23411188350458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhere is lamp (annotated by the red box) located in relation to lamp in the image?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670291_62374624597291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to table lamp (highlighted by a red box)? Select from glass vase (highlighted by a blue box) and table (highlighted by a green box).\n(A) glass vase\n(B) table" }, { "from": "gpt", "value": "(A) glass vase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430269_185567610918083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, table (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) table\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204481_24836568598208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, table (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) table\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446588_206089149714666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the bulletin board (highlighted by a red box)? Choose among these: lamp (highlighted by a blue box) or lamp (highlighted by a green box).\n(A) lamp\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895863_107761761345083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, drawer (highlighted by a red box) or desk (highlighted by a blue box)?\n(A) drawer\n(B) desk" }, { "from": "gpt", "value": "(B) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429728_19160029454333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, book (highlighted by a red box) or paperback book (highlighted by a blue box)?\n(A) book\n(B) paperback book" }, { "from": "gpt", "value": "(B) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358345_15190821036458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, light fixture (highlighted by a red box) or faucet (highlighted by a blue box)?\n(A) light fixture\n(B) faucet" }, { "from": "gpt", "value": "(A) light fixture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670356_67363487214541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, door (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) door\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897607_137243630771208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chest of drawers (highlighted by a red box) or concrete (highlighted by a blue box)?\n(A) chest of drawers\n(B) concrete" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334624_385728521535833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chair (highlighted by a red box) or table (highlighted by a blue box)?\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444513_3461447973791_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from waste container (highlighted by a red box)? towel bar (highlighted by a blue box) or toilet (highlighted by a green box)?\n(A) towel bar\n(B) toilet" }, { "from": "gpt", "value": "(A) towel bar" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430269_185621605645333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, bottle (highlighted by a red box) or table (highlighted by a blue box)?\n(A) bottle\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333205_48128383393125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, bathtub (highlighted by a red box) or cleaning product (highlighted by a blue box)?\n(A) bathtub\n(B) cleaning product" }, { "from": "gpt", "value": "(A) bathtub" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663312_76646370244666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, cabinetry (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) cabinetry\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739611_200250545892250_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the bathroom cabinet (highlighted by a red box)? ceramic tile (highlighted by a blue box) or door handle (highlighted by a green box).\n(A) ceramic tile\n(B) door handle" }, { "from": "gpt", "value": "(A) ceramic tile" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895623_470761044548833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, washing machine (highlighted by a red box) or power outlet (highlighted by a blue box)?\n(A) washing machine\n(B) power outlet" }, { "from": "gpt", "value": "(A) washing machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897409_102983180796416_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from appliance (highlighted by a red box), sink (highlighted by a blue box) or cabinetry (highlighted by a green box)?\n(A) sink\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018818_20036035059041_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from shelf (highlighted by a red box)? Choose from basket (highlighted by a blue box) and bath towel (highlighted by a green box).\n(A) basket\n(B) bath towel" }, { "from": "gpt", "value": "(B) bath towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899936_863309277380083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from screen door (highlighted by a red box)? stool (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) stool\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204678_12522433679250_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to toy (highlighted by a red box)? Choose from toy (highlighted by a blue box) and chair (highlighted by a green box).\n(A) toy\n(B) chair" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739629_1932972291500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, hair drier (highlighted by a red box) or underclothes (highlighted by a blue box)?\n(A) hair drier\n(B) underclothes" }, { "from": "gpt", "value": "(B) underclothes" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458447_117524581556458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, bookcase (highlighted by a red box) or book (highlighted by a blue box)?\n(A) bookcase\n(B) book" }, { "from": "gpt", "value": "(A) bookcase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429822_744781297421375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the chair (highlighted by a red box)? studio couch (highlighted by a blue box) or table (highlighted by a green box).\n(A) studio couch\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204506_718457595166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, appliance (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796210_1412855561250_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to pillow (highlighted by a red box), bed (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) bed\n(B) picture frame" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663009_32418513649458_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from chest of drawers (highlighted by a red box)? Select from studio couch (highlighted by a blue box) and mat (highlighted by a green box).\n(A) studio couch\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334057_86284893286041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the swivel chair (highlighted by a red box)? Choose among these: chair (highlighted by a blue box) or design (highlighted by a green box).\n(A) chair\n(B) design" }, { "from": "gpt", "value": "(B) design" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896461_21746885496125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the armchair (highlighted by a red box)? Choose among these: radiator (highlighted by a blue box) or screen door (highlighted by a green box).\n(A) radiator\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331934_163603787506166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, wrapping paper (highlighted by a red box) or handbag (highlighted by a blue box)?\n(A) wrapping paper\n(B) handbag" }, { "from": "gpt", "value": "(A) wrapping paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896231_7013721348916_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the pillow (highlighted by a red box)? table (highlighted by a blue box) or studio couch (highlighted by a green box).\n(A) table\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895679_370063957427041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, curtain (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) curtain\n(B) basket" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898349_509481012764375_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898343_508277606922375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, door (highlighted by a red box) or concrete (highlighted by a blue box)?\n(A) door\n(B) concrete" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018808_19365779440583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from appliance (highlighted by a red box)? Select from chair (highlighted by a blue box) and appliance (highlighted by a green box).\n(A) chair\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429816_744528900586375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is glass box (annotated by the red box) located relative to table?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430554_301350252300541_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, chest of drawers (highlighted by a red box) or nightstand (highlighted by a blue box)?\n(A) chest of drawers\n(B) nightstand" }, { "from": "gpt", "value": "(B) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899311_885895730085916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204519_1698065667166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018872_653502584367708_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, houseplant (highlighted by a red box) or window (highlighted by a blue box)?\n(A) houseplant\n(B) window" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663009_32384511128291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, table (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) table\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649603_35979600408750_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from desk (highlighted by a red box)? mobile phone (highlighted by a blue box) or coffee cup (highlighted by a green box)?\n(A) mobile phone\n(B) coffee cup" }, { "from": "gpt", "value": "(A) mobile phone" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331625_20138837475708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of door (annotated by the red box) in relation to bowl? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896121_145903129981041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to picture frame (highlighted by a red box)? picture frame (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) picture frame\n(B) pillow" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333888_78835251775958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, mirror (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) mirror\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899474_954131623595500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is door (annotated by the red box) located relative to door? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896043_130149039471625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from tap (highlighted by a red box)? door (highlighted by a blue box) or towel (highlighted by a green box)?\n(A) door\n(B) towel" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897743_116082863732750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, sink (highlighted by a red box) or ceramic tile (highlighted by a blue box)?\n(A) sink\n(B) ceramic tile" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895911_111566845873958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, basket (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) basket\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260946_4655886507291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, picture frame (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) picture frame\n(B) lamp" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444907_106160760853250_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from microwave oven (highlighted by a red box)? Select from chair (highlighted by a blue box) and chair (highlighted by a green box).\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447210_209230773098291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, furniture (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) furniture\n(B) bottle" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430510_299366862578666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, flower (highlighted by a red box) or flower (highlighted by a blue box)?\n(A) flower\n(B) flower" }, { "from": "gpt", "value": "(A) flower" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458451_118206526886500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, chair (highlighted by a red box) or kitchen & dining room table (highlighted by a blue box)?\n(A) chair\n(B) kitchen & dining room table" }, { "from": "gpt", "value": "(B) kitchen & dining room table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649417_10177589935708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, book (highlighted by a red box) or coffee table (highlighted by a blue box)?\n(A) book\n(B) coffee table" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018585_5488289632708_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from glass table (highlighted by a red box)? table (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) table\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333564_200611774747791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, dresser (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) dresser\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333324_29354228977791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, vase (highlighted by a red box) or bed (highlighted by a blue box)?\n(A) vase\n(B) bed" }, { "from": "gpt", "value": "(B) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899640_231840092261583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, chest of drawers (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) chest of drawers\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444872_98035187796333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to table lamp (highlighted by a red box)? swivel chair (highlighted by a blue box) or table (highlighted by a green box).\n(A) swivel chair\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115198_94367650984125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from curtain (highlighted by a red box)? curtain (highlighted by a blue box) or lamp (highlighted by a green box)?\n(A) curtain\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662897_19447202142291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, dumbbell (highlighted by a red box) or dumbbell (highlighted by a blue box)?\n(A) dumbbell\n(B) dumbbell" }, { "from": "gpt", "value": "(B) dumbbell" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458756_141616940881083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, cabinetry (highlighted by a red box) or clothesline (highlighted by a blue box)?\n(A) cabinetry\n(B) clothesline" }, { "from": "gpt", "value": "(B) clothesline" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332207_264507768372875_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from gas stove (highlighted by a red box)? tile (highlighted by a blue box) or appliance (highlighted by a green box)?\n(A) tile\n(B) appliance" }, { "from": "gpt", "value": "(A) tile" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204858_1618826467583_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to mirror (highlighted by a red box)? Select from sink (highlighted by a blue box) and tap (highlighted by a green box).\n(A) sink\n(B) tap" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662870_14542370755416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, door (highlighted by a red box) or chest of drawers (highlighted by a blue box)?\n(A) door\n(B) chest of drawers" }, { "from": "gpt", "value": "(B) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445040_1789445736458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, computer monitor (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) computer monitor\n(B) toy" }, { "from": "gpt", "value": "(A) computer monitor" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458675_9317700690916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, studio couch (highlighted by a red box) or bean bag chair (highlighted by a blue box)?\n(A) studio couch\n(B) bean bag chair" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333806_51311944957083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, table (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739686_1043333906958_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to picture frame (highlighted by a red box)? Select from picture frame (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333298_26624431929416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the plumbing fixture (highlighted by a red box)? shower (highlighted by a blue box) or plant (highlighted by a green box).\n(A) shower\n(B) plant" }, { "from": "gpt", "value": "(A) shower" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899285_885267560262625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from cabinetry (highlighted by a red box)? Select from power outlet (highlighted by a blue box) and appliance (highlighted by a green box).\n(A) power outlet\n(B) appliance" }, { "from": "gpt", "value": "(A) power outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898621_757868209842625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, counter top (highlighted by a red box) or counter top (highlighted by a blue box)?\n(A) counter top\n(B) counter top" }, { "from": "gpt", "value": "(B) counter top" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332022_202467103817125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, table (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) table\n(B) pillow" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669880_11310304585125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chair (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) chair\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662890_19624695214125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, toilet paper (highlighted by a red box) or picnic basket (highlighted by a blue box)?\n(A) toilet paper\n(B) picnic basket" }, { "from": "gpt", "value": "(B) picnic basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334189_354683359444000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, home appliance (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) home appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(A) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334842_614768882686625_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896404_16707523236833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to air conditioning (highlighted by a red box)? speaker (highlighted by a blue box) or window (highlighted by a green box).\n(A) speaker\n(B) window" }, { "from": "gpt", "value": "(A) speaker" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663223_66694272580833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, footwear (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) footwear\n(B) toy" }, { "from": "gpt", "value": "(A) footwear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444588_31799307963083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, screen door (highlighted by a red box) or window (highlighted by a blue box)?\n(A) screen door\n(B) window" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260957_5970288115708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the plank (highlighted by a red box)? furniture (highlighted by a blue box) or plank (highlighted by a green box).\n(A) furniture\n(B) plank" }, { "from": "gpt", "value": "(B) plank" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018844_649795213201000_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from television (highlighted by a red box)? desk (highlighted by a blue box) or table (highlighted by a green box)?\n(A) desk\n(B) table" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333876_77226372606333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, oven (highlighted by a red box) or kitchen appliance (highlighted by a blue box)?\n(A) oven\n(B) kitchen appliance" }, { "from": "gpt", "value": "(B) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331159_181765008535375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, lamp (highlighted by a red box) or menu (highlighted by a blue box)?\n(A) lamp\n(B) menu" }, { "from": "gpt", "value": "(B) menu" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334934_663219596353916_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the book (highlighted by a red box)? Choose among these: book (highlighted by a blue box) or book (highlighted by a green box).\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828442_91394140679583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, curtain (highlighted by a red box) or light (highlighted by a blue box)?\n(A) curtain\n(B) light" }, { "from": "gpt", "value": "(B) light" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649802_46841299091416_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the pillow (highlighted by a red box)? Choose among these: studio couch (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430212_688675349601416_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to bottle (highlighted by a red box)? Choose from cabinetry (highlighted by a blue box) and paper towel (highlighted by a green box).\n(A) cabinetry\n(B) paper towel" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333810_51918859849041_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to desk (highlighted by a red box), computer monitor (highlighted by a blue box) or mouse (highlighted by a green box)?\n(A) computer monitor\n(B) mouse" }, { "from": "gpt", "value": "(A) computer monitor" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739281_42566768354958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to wood burning stove (highlighted by a red box)? Select from picture frame (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018339_117104914555708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, table (highlighted by a red box) or box (highlighted by a blue box)?\n(A) table\n(B) box" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662960_24776795027375_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the toiletry (highlighted by a red box)? bath (highlighted by a blue box) or mirror (highlighted by a green box).\n(A) bath\n(B) mirror" }, { "from": "gpt", "value": "(B) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334609_385042646031083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from toy car (highlighted by a red box), curtain (highlighted by a blue box) or toy (highlighted by a green box)?\n(A) curtain\n(B) toy" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333875_76139472525208_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from infant bed (highlighted by a red box)? Select from furniture (highlighted by a blue box) and door (highlighted by a green box).\n(A) furniture\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670150_40451638223791_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from chest of drawers (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331028_474728319331333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of chair (annotated by the red box) in reference to table? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333876_77238367736208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, cupboard (highlighted by a red box) or glass plate (highlighted by a blue box)?\n(A) cupboard\n(B) glass plate" }, { "from": "gpt", "value": "(A) cupboard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430209_688498754154541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to cabinetry (highlighted by a red box)? cabinetry (highlighted by a blue box) or cabinet (highlighted by a green box).\n(A) cabinetry\n(B) cabinet" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331170_274340873317500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the bed (highlighted by a red box)? nightstand (highlighted by a blue box) or table lamp (highlighted by a green box).\n(A) nightstand\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649393_11187710689500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, book cover (highlighted by a red box) or paperback book (highlighted by a blue box)?\n(A) book cover\n(B) paperback book" }, { "from": "gpt", "value": "(A) book cover" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018815_19980740731250_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331432_546054304710541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to balloon (highlighted by a red box), armchair (highlighted by a blue box) or balloon (highlighted by a green box)?\n(A) armchair\n(B) balloon" }, { "from": "gpt", "value": "(A) armchair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828150_73489798485291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895274_79173011230791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, cabinetry (highlighted by a red box) or hand towel (highlighted by a blue box)?\n(A) cabinetry\n(B) hand towel" }, { "from": "gpt", "value": "(B) hand towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896117_145996724463958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, picture frame (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) picture frame\n(B) pillow" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333331_29940931362166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, toothbrush (highlighted by a red box) or toilet (highlighted by a blue box)?\n(A) toothbrush\n(B) toilet" }, { "from": "gpt", "value": "(B) toilet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115227_95952840332000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796477_4142725044291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is beach towel (annotated by the red box) located in relation to beach towel in the image? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333275_24563502729791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to shelf (highlighted by a red box)? bookcase (highlighted by a blue box) or book (highlighted by a green box).\n(A) bookcase\n(B) book" }, { "from": "gpt", "value": "(A) bookcase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739255_39641229502250_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from bottle (highlighted by a red box)? cleaning product (highlighted by a blue box) or wide (highlighted by a green box)?\n(A) cleaning product\n(B) wide" }, { "from": "gpt", "value": "(B) wide" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662962_24672386361916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, lamp (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) lamp\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649474_14637230540416_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from studio couch (highlighted by a red box), pillow (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) pillow\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334914_1090103671486000_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to window (highlighted by a red box)? Select from lantern (highlighted by a blue box) and gas stove (highlighted by a green box).\n(A) lantern\n(B) gas stove" }, { "from": "gpt", "value": "(B) gas stove" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429729_19013639109208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chair (highlighted by a red box) or book (highlighted by a blue box)?\n(A) chair\n(B) book" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018087_104059922016291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from toiletry (highlighted by a red box), mouthwash (highlighted by a blue box) or cleaning product (highlighted by a green box)?\n(A) mouthwash\n(B) cleaning product" }, { "from": "gpt", "value": "(A) mouthwash" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739926_16293570000208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, television (highlighted by a red box) or toilet bowl (highlighted by a blue box)?\n(A) television\n(B) toilet bowl" }, { "from": "gpt", "value": "(B) toilet bowl" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48017887_80052904273875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, box (highlighted by a red box) or box (highlighted by a blue box)?\n(A) box\n(B) box" }, { "from": "gpt", "value": "(B) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261686_3847945614166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, picnic basket (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) picnic basket\n(B) basket" }, { "from": "gpt", "value": "(A) picnic basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430089_27763256088000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of poster (annotated by the red box) in relation to toy? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739329_45627715181125_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332204_264225182969333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chair (highlighted by a red box) or couch (highlighted by a blue box)?\n(A) chair\n(B) couch" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458282_76389438351166_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from picture frame (highlighted by a red box)? lamp (highlighted by a blue box) or couch (highlighted by a green box)?\n(A) lamp\n(B) couch" }, { "from": "gpt", "value": "(B) couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663258_77870873818500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, bath (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) bath\n(B) furniture" }, { "from": "gpt", "value": "(A) bath" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332397_401448516010541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, screen door (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) screen door\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444695_72616579188833_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to picture frame (highlighted by a red box)? table (highlighted by a blue box) or glass door (highlighted by a green box).\n(A) table\n(B) glass door" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899282_885239555213791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to tile (highlighted by a red box)? Select from stairwell (highlighted by a blue box) and postcard (highlighted by a green box).\n(A) stairwell\n(B) postcard" }, { "from": "gpt", "value": "(B) postcard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018415_394371234530958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from toaster (highlighted by a red box), table (highlighted by a blue box) or bottle (highlighted by a green box)?\n(A) table\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332489_341244292606250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, bath (highlighted by a red box) or soap dispenser (highlighted by a blue box)?\n(A) bath\n(B) soap dispenser" }, { "from": "gpt", "value": "(B) soap dispenser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429824_746599587630250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of air conditioning (annotated by the red box) and exhaust hood in the image provided, where is air conditioning (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662908_20208847630000_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from book (highlighted by a red box)? Choose among these: pillow (highlighted by a blue box) or electric outlet (highlighted by a green box).\n(A) pillow\n(B) electric outlet" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670124_41664479893500_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from bottle (highlighted by a red box)? cabinetry (highlighted by a blue box) or cabinetry (highlighted by a green box)?\n(A) cabinetry\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897462_470068071016500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, studio couch (highlighted by a red box) or entertainment center (highlighted by a blue box)?\n(A) studio couch\n(B) entertainment center" }, { "from": "gpt", "value": "(B) entertainment center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897467_471469816285416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, chair (highlighted by a red box) or kitchen & dining room table (highlighted by a blue box)?\n(A) chair\n(B) kitchen & dining room table" }, { "from": "gpt", "value": "(B) kitchen & dining room table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430293_187354353440833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, table (highlighted by a red box) or book (highlighted by a blue box)?\n(A) table\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899352_715969282859708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, counter top (highlighted by a red box) or luggage (highlighted by a blue box)?\n(A) counter top\n(B) luggage" }, { "from": "gpt", "value": "(A) counter top" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204474_24939377876750_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, cabinetry (highlighted by a red box) or box (highlighted by a blue box)?\n(A) cabinetry\n(B) box" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261096_1274444299541_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, bottle (highlighted by a red box) or kitchen appliance (highlighted by a blue box)?\n(A) bottle\n(B) kitchen appliance" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332946_20787035629291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of picture frame (annotated by the red box) in relation to light?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358673_933098863041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from kitchen & dining room table (highlighted by a red box)? Choose from chair (highlighted by a blue box) and chair (highlighted by a green box).\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649639_39661443878916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, glass vase (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) glass vase\n(B) electric outlet" }, { "from": "gpt", "value": "(A) glass vase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796191_550730344333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of picture frame (annotated by the red box) and door in the image provided, where is picture frame (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334057_86219986227958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, stationary bicycle (highlighted by a red box) or paper towel (highlighted by a blue box)?\n(A) stationary bicycle\n(B) paper towel" }, { "from": "gpt", "value": "(B) paper towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446493_356510657157500_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from appliance (highlighted by a red box)? Select from cabinetry (highlighted by a blue box) and window (highlighted by a green box).\n(A) cabinetry\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663322_77615662647375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to radiator (highlighted by a red box)? chair (highlighted by a blue box) or light fixture (highlighted by a green box).\n(A) chair\n(B) light fixture" }, { "from": "gpt", "value": "(B) light fixture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897655_147155781527125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, studio couch (highlighted by a red box) or counter top (highlighted by a blue box)?\n(A) studio couch\n(B) counter top" }, { "from": "gpt", "value": "(B) counter top" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445100_9192782469250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of window (annotated by the red box) in reference to curtain?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334890_623277947325000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, curtain (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) curtain\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444762_81589470069750_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to toilet paper (highlighted by a red box)? bottle (highlighted by a blue box) or chest of drawers (highlighted by a green box).\n(A) bottle\n(B) chest of drawers" }, { "from": "gpt", "value": "(B) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828449_91285233903500_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from studio couch (highlighted by a red box)? Choose from side table (highlighted by a blue box) and fireplace (highlighted by a green box).\n(A) side table\n(B) fireplace" }, { "from": "gpt", "value": "(B) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649742_49552998401708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, furniture (highlighted by a red box) or concrete (highlighted by a blue box)?\n(A) furniture\n(B) concrete" }, { "from": "gpt", "value": "(B) concrete" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260957_5986298451708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, window (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) window\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898786_67362014647332_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to christmas tree (highlighted by a red box)? Select from studio couch (highlighted by a blue box) and throw pillow (highlighted by a green box).\n(A) studio couch\n(B) throw pillow" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018113_368471021987875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from countertop (highlighted by a red box)? Select from chair (highlighted by a blue box) and bottle (highlighted by a green box).\n(A) chair\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260938_4892193054125_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from bowl (highlighted by a red box)? mat (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) mat\n(B) chair" }, { "from": "gpt", "value": "(A) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444706_73264576100333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, nightstand (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) nightstand\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430862_74317892862958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, furniture (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) furniture\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898261_696851431456958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, computer monitor (highlighted by a red box) or desk (highlighted by a blue box)?\n(A) computer monitor\n(B) desk" }, { "from": "gpt", "value": "(B) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358645_3274237979291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to sink (highlighted by a red box), cabinetry (highlighted by a blue box) or appliance (highlighted by a green box)?\n(A) cabinetry\n(B) appliance" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663330_77419960602500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662905_20056161107041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, desk (highlighted by a red box) or table (highlighted by a blue box)?\n(A) desk\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430944_96285751316750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, clock (highlighted by a red box) or window (highlighted by a blue box)?\n(A) clock\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334879_621770818206958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to desk (highlighted by a red box)? Choose from chair (highlighted by a blue box) and paperback book (highlighted by a green box).\n(A) chair\n(B) paperback book" }, { "from": "gpt", "value": "(B) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018487_529096862434000_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the book (highlighted by a red box)? Choose among these: shelf (highlighted by a blue box) or book (highlighted by a green box).\n(A) shelf\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444709_74144414115000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, chest of drawers (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) chest of drawers\n(B) lamp" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670218_54015966257791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to radiator (highlighted by a red box)? light switch (highlighted by a blue box) or door (highlighted by a green box).\n(A) light switch\n(B) door" }, { "from": "gpt", "value": "(A) light switch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261344_24355541044333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to chair (highlighted by a red box)? Select from table (highlighted by a blue box) and table (highlighted by a green box).\n(A) table\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334849_615458536704875_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from toilet bowl (highlighted by a red box), toilet paper (highlighted by a blue box) or movie poster (highlighted by a green box)?\n(A) toilet paper\n(B) movie poster" }, { "from": "gpt", "value": "(B) movie poster" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897478_112699149767916_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204724_23476522985791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from chair (highlighted by a red box)? chair (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) chair\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445869_71863096310166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from lamp (highlighted by a red box), nightstand (highlighted by a blue box) or bed (highlighted by a green box)?\n(A) nightstand\n(B) bed" }, { "from": "gpt", "value": "(B) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333581_207636033433875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chair (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) chair\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334195_355859323705541_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears farthest from the camera in this image?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333277_24315804200625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, person (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) person\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895591_1161464577748750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, picture frame (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) picture frame\n(B) shelf" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895863_107802161276291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to plain (highlighted by a red box)? Select from book (highlighted by a blue box) and lamp (highlighted by a green box).\n(A) book\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899307_885757936830416_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from baby carriage (highlighted by a red box)? person (highlighted by a blue box) or door (highlighted by a green box)?\n(A) person\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115445_11865047697333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, clothing (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) clothing\n(B) basket" }, { "from": "gpt", "value": "(B) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899957_865518967316000_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899968_712561880625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, drawer (highlighted by a red box) or cabinet (highlighted by a blue box)?\n(A) drawer\n(B) cabinet" }, { "from": "gpt", "value": "(A) drawer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204795_24307827224791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to sink (highlighted by a red box)? Choose from soap (highlighted by a blue box) and houseplant (highlighted by a green box).\n(A) soap\n(B) houseplant" }, { "from": "gpt", "value": "(A) soap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446450_354591020827000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to chair (highlighted by a red box)? pillow (highlighted by a blue box) or table (highlighted by a green box).\n(A) pillow\n(B) table" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896174_140822424313125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of fireplace (annotated by the red box) in relation to lamp?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895908_110748940874125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from pillow (highlighted by a red box)? Choose among these: table (highlighted by a blue box) or table lamp (highlighted by a green box).\n(A) table\n(B) table lamp" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334754_421203713643833_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261294_16264831946083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the radiator (highlighted by a red box)? Choose among these: bath towel (highlighted by a blue box) or shelf (highlighted by a green box).\n(A) bath towel\n(B) shelf" }, { "from": "gpt", "value": "(A) bath towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332606_363392320326583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of poster (annotated by the red box) in relation to door? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261164_769912074166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to door (highlighted by a red box)? pillow (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669881_11004909033916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to bar stool (highlighted by a red box)? Choose from chest of drawers (highlighted by a blue box) and bar stool (highlighted by a green box).\n(A) chest of drawers\n(B) bar stool" }, { "from": "gpt", "value": "(B) bar stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739635_2322155544291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, sink (highlighted by a red box) or bath (highlighted by a blue box)?\n(A) sink\n(B) bath" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739281_42598771777708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from book (highlighted by a red box)? book (highlighted by a blue box) or armchair (highlighted by a green box)?\n(A) book\n(B) armchair" }, { "from": "gpt", "value": "(B) armchair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828150_73401402051500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, cabinetry (highlighted by a red box) or cupboard (highlighted by a blue box)?\n(A) cabinetry\n(B) cupboard" }, { "from": "gpt", "value": "(B) cupboard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649393_11263695801916_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from picture frame (highlighted by a red box)? picture frame (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018487_529074871469791_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears farthest from the camera in this image?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828311_76564529445416_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to mirror (highlighted by a red box)? Choose from appliance (highlighted by a blue box) and plant (highlighted by a green box).\n(A) appliance\n(B) plant" }, { "from": "gpt", "value": "(B) plant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739686_1047348979250_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to studio couch (highlighted by a red box)? Select from pillow (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895298_90997128126000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to chair (highlighted by a red box)? Choose from magazine (highlighted by a blue box) and table (highlighted by a green box).\n(A) magazine\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018307_109090177704458_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chair (highlighted by a red box) or swivel chair (highlighted by a blue box)?\n(A) chair\n(B) swivel chair" }, { "from": "gpt", "value": "(B) swivel chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358691_3244529229541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from dresser (highlighted by a red box), pillow (highlighted by a blue box) or studio couch (highlighted by a green box)?\n(A) pillow\n(B) studio couch" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895614_470447103425500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, appliance (highlighted by a red box) or wood (highlighted by a blue box)?\n(A) appliance\n(B) wood" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333283_25423436354166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, picture frame (highlighted by a red box) or bed (highlighted by a blue box)?\n(A) picture frame\n(B) bed" }, { "from": "gpt", "value": "(B) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828441_91482339056666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from clock (highlighted by a red box)? Choose among these: window (highlighted by a blue box) or window screen (highlighted by a green box).\n(A) window\n(B) window screen" }, { "from": "gpt", "value": "(B) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430942_95494784011291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, toilet paper (highlighted by a red box) or paper towel (highlighted by a blue box)?\n(A) toilet paper\n(B) paper towel" }, { "from": "gpt", "value": "(B) paper towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115624_3663098612000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from appliance (highlighted by a red box)? appliance (highlighted by a blue box) or light fixture (highlighted by a green box)?\n(A) appliance\n(B) light fixture" }, { "from": "gpt", "value": "(B) light fixture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334714_533671584879750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, printer (highlighted by a red box) or file cabinet (highlighted by a blue box)?\n(A) printer\n(B) file cabinet" }, { "from": "gpt", "value": "(B) file cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898651_572749825329416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, table (highlighted by a red box) or condominium (highlighted by a blue box)?\n(A) table\n(B) condominium" }, { "from": "gpt", "value": "(B) condominium" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739563_198342151043916_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the cabinetry (highlighted by a red box)? Choose among these: cabinetry (highlighted by a blue box) or material (highlighted by a green box).\n(A) cabinetry\n(B) material" }, { "from": "gpt", "value": "(B) material" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333265_21732107864458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, bottle (highlighted by a red box) or tile (highlighted by a blue box)?\n(A) bottle\n(B) tile" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663322_77553655106333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, appliance (highlighted by a red box) or countertop (highlighted by a blue box)?\n(A) appliance\n(B) countertop" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895591_1161430574835125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, home appliance (highlighted by a red box) or toilet bowl (highlighted by a blue box)?\n(A) home appliance\n(B) toilet bowl" }, { "from": "gpt", "value": "(A) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115361_860469128666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, studio couch (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333659_130396170003541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, shelf (highlighted by a red box) or window (highlighted by a blue box)?\n(A) shelf\n(B) window" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018832_649276260156958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from drawer (highlighted by a red box)? Select from bed (highlighted by a blue box) and footwear (highlighted by a green box).\n(A) bed\n(B) footwear" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430598_315301514765208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, window (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) window\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445843_69305652066915_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, television (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) television\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895272_79448399338250_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from curtain (highlighted by a red box)? window (highlighted by a blue box) or studio couch (highlighted by a green box)?\n(A) window\n(B) studio couch" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444917_220420867839958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, window (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) window\n(B) window sill" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430800_61155861713875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, clock (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) clock\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895279_79215910500375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, window (highlighted by a red box) or desk (highlighted by a blue box)?\n(A) window\n(B) desk" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662829_15211601389041_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670063_37977520987500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of mirror (annotated by the red box) and window in the image provided, where is mirror (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115180_104059744938916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, curtain (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) curtain\n(B) pillow" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115519_13182177491875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to toiletry (highlighted by a red box)? Select from toiletry (highlighted by a blue box) and toiletry (highlighted by a green box).\n(A) toiletry\n(B) toiletry" }, { "from": "gpt", "value": "(A) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018708_545436263405416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of stairs (annotated by the red box) in relation to curtain?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018524_821521993493375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, control (highlighted by a red box) or control (highlighted by a blue box)?\n(A) control\n(B) control" }, { "from": "gpt", "value": "(B) control" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896103_145404907549291_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662959_24569493724250_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from toiletry (highlighted by a red box)? Select from sink (highlighted by a blue box) and mirror (highlighted by a green box).\n(A) sink\n(B) mirror" }, { "from": "gpt", "value": "(B) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670350_67522590951333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is furniture (annotated by the red box) located in relation to blanket in the image? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331183_277542211884333_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333949_45739793753833_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458260_74351042218541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the door (highlighted by a red box)? Choose among these: stairs (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) stairs\n(B) cabinetry" }, { "from": "gpt", "value": "(A) stairs" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895936_107845519413583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, bowl (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) bowl\n(B) bottle" }, { "from": "gpt", "value": "(A) bowl" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899057_647078692272250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, stairs (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) stairs\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796492_1646076207500_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to screen door (highlighted by a red box)? door (highlighted by a blue box) or light switch (highlighted by a green box).\n(A) door\n(B) light switch" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331812_228095376331875_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from table (highlighted by a red box)? chair (highlighted by a blue box) or stairwell (highlighted by a green box)?\n(A) chair\n(B) stairwell" }, { "from": "gpt", "value": "(B) stairwell" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828272_84550792273083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897720_114150639901791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, furniture (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) furniture\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896169_140735525362458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is studio couch (annotated by the red box) located relative to pillow?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333323_29413121706166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, toiletry (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) toiletry\n(B) toiletry" }, { "from": "gpt", "value": "(A) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444511_3383846605083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, bathroom cabinet (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) bathroom cabinet\n(B) toiletry" }, { "from": "gpt", "value": "(A) bathroom cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333205_48088183004166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, appliance (highlighted by a red box) or shower door (highlighted by a blue box)?\n(A) appliance\n(B) shower door" }, { "from": "gpt", "value": "(B) shower door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896522_34672332686125_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the paperback book (highlighted by a red box)? Choose among these: paperback book (highlighted by a blue box) or paperback book (highlighted by a green box).\n(A) paperback book\n(B) paperback book" }, { "from": "gpt", "value": "(A) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018284_799356115470833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chair (highlighted by a red box) or plant (highlighted by a blue box)?\n(A) chair\n(B) plant" }, { "from": "gpt", "value": "(B) plant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444574_31875810236916_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to counter top (highlighted by a red box)? electric outlet (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) electric outlet\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430690_327461982744791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, curtain (highlighted by a red box) or window (highlighted by a blue box)?\n(A) curtain\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458688_9243498241291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is mirror (annotated by the red box) located in relation to studio couch in the image? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796684_30821134476583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of furniture (annotated by the red box) in relation to door? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358250_6011852098583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, window (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) window\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429765_358270647959458_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from toilet paper (highlighted by a red box)? table (highlighted by a blue box) or toilet paper (highlighted by a green box)?\n(A) table\n(B) toilet paper" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897948_351333904530791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, curtain (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) curtain\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333275_24834508045666_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to picture frame (highlighted by a red box), picture frame (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444574_31883806992375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chair (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) chair\n(B) cabinetry" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332992_125217689982250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, window (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) window\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796279_910861486208_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the toiletry (highlighted by a red box)? bath (highlighted by a blue box) or cleaning product (highlighted by a green box).\n(A) bath\n(B) cleaning product" }, { "from": "gpt", "value": "(B) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670184_51647738702000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, bed (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) bed\n(B) picture frame" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896035_129261732264750_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from book (highlighted by a red box)? picture frame (highlighted by a blue box) or book (highlighted by a green box)?\n(A) picture frame\n(B) book" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458562_128114212475666_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from bottle (highlighted by a red box)? Select from bottle (highlighted by a blue box) and bottle (highlighted by a green box).\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261485_41950869235333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from furniture (highlighted by a red box)? curtain (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) curtain\n(B) pillow" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895179_37903669909958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from table lamp (highlighted by a red box)? Choose among these: furniture (highlighted by a blue box) or magazine (highlighted by a green box).\n(A) furniture\n(B) magazine" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446497_357480935952208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, toiletry (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) toiletry\n(B) toiletry" }, { "from": "gpt", "value": "(A) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115217_94924740505291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, refrigerator (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) refrigerator\n(B) shelf" }, { "from": "gpt", "value": "(A) refrigerator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458301_77391218941875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, clothing (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) clothing\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332519_415988445918083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, door (highlighted by a red box) or box (highlighted by a blue box)?\n(A) door\n(B) box" }, { "from": "gpt", "value": "(B) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260877_7387164833375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from appliance (highlighted by a red box)? countertop (highlighted by a blue box) or wok (highlighted by a green box)?\n(A) countertop\n(B) wok" }, { "from": "gpt", "value": "(B) wok" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444721_75300063871083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is waste container (annotated by the red box) located relative to concrete? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897655_147075080818583_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897924_348983829526458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, mug (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) mug\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828596_104251356799541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to book (highlighted by a red box)? book (highlighted by a blue box) or bookshelf (highlighted by a green box).\n(A) book\n(B) bookshelf" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115217_94892737109041_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895199_39393027188916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to cabinetry (highlighted by a red box)? Select from plant (highlighted by a blue box) and door (highlighted by a green box).\n(A) plant\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662829_15217598904166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from cabinetry (highlighted by a red box), bottle (highlighted by a blue box) or door (highlighted by a green box)?\n(A) bottle\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649464_13883129043666_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, book (highlighted by a red box) or paperback book (highlighted by a blue box)?\n(A) book\n(B) paperback book" }, { "from": "gpt", "value": "(B) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669959_27844886065583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from beach towel (highlighted by a red box)? door (highlighted by a blue box) or countertop (highlighted by a green box)?\n(A) door\n(B) countertop" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331276_12771443434375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, appliance (highlighted by a red box) or home appliance (highlighted by a blue box)?\n(A) appliance\n(B) home appliance" }, { "from": "gpt", "value": "(B) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333275_24577513652666_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, studio couch (highlighted by a red box) or plywood (highlighted by a blue box)?\n(A) studio couch\n(B) plywood" }, { "from": "gpt", "value": "(B) plywood" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458562_128110214136666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to bottle (highlighted by a red box)? Choose from box (highlighted by a blue box) and box (highlighted by a green box).\n(A) box\n(B) box" }, { "from": "gpt", "value": "(B) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796684_30847140309166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, footwear (highlighted by a red box) or footwear (highlighted by a blue box)?\n(A) footwear\n(B) footwear" }, { "from": "gpt", "value": "(B) footwear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358118_62529280983208_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to picture frame (highlighted by a red box)? Choose from appliance (highlighted by a blue box) and television (highlighted by a green box).\n(A) appliance\n(B) television" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334491_104490022970125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, computer chair (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) computer chair\n(B) curtain" }, { "from": "gpt", "value": "(A) computer chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333838_54142566839250_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670291_62364611897625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, table lamp (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) table lamp\n(B) studio couch" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429765_358238644318041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, bathtub (highlighted by a red box) or faucet (highlighted by a blue box)?\n(A) bathtub\n(B) faucet" }, { "from": "gpt", "value": "(A) bathtub" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670311_64366842687583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, mirror (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) mirror\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332505_343944877349541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to infant bed (highlighted by a red box)? swivel chair (highlighted by a blue box) or book (highlighted by a green box).\n(A) swivel chair\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018284_799348118709666_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the desk (highlighted by a red box)? Choose among these: cabinetry (highlighted by a blue box) or shelf (highlighted by a green box).\n(A) cabinetry\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898261_697058229480375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, table (highlighted by a red box) or window (highlighted by a blue box)?\n(A) table\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896490_31600347975375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, toiletry (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) toiletry\n(B) toiletry" }, { "from": "gpt", "value": "(B) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261675_3129440744041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, cabinetry (highlighted by a red box) or chest of drawers (highlighted by a blue box)?\n(A) cabinetry\n(B) chest of drawers" }, { "from": "gpt", "value": "(B) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649643_40403117099458_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, bottle (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) bottle\n(B) toiletry" }, { "from": "gpt", "value": "(B) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896195_142266034756166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, door (highlighted by a red box) or clothing (highlighted by a blue box)?\n(A) door\n(B) clothing" }, { "from": "gpt", "value": "(B) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429822_744769302326958_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, curtain (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) curtain\n(B) shelf" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018068_98206978824541_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears farthest from the camera in this image?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261344_24331550547750_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to candle holder (highlighted by a red box)? Select from picture frame (highlighted by a blue box) and screen door (highlighted by a green box).\n(A) picture frame\n(B) screen door" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334194_355819023357208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, bath (highlighted by a red box) or paperback book (highlighted by a blue box)?\n(A) bath\n(B) paperback book" }, { "from": "gpt", "value": "(A) bath" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897712_112103290098458_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445721_63553104247833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, door (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) door\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430288_186638960477666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, refrigerator (highlighted by a red box) or beach towel (highlighted by a blue box)?\n(A) refrigerator\n(B) beach towel" }, { "from": "gpt", "value": "(B) beach towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261313_22291850443958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to window (highlighted by a red box)? Select from radiator (highlighted by a blue box) and window sill (highlighted by a green box).\n(A) radiator\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899060_648266341588750_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from mirror (highlighted by a red box)? Choose from light (highlighted by a blue box) and toilet paper (highlighted by a green box).\n(A) light\n(B) toilet paper" }, { "from": "gpt", "value": "(A) light" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430820_65679179797125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, tableware (highlighted by a red box) or glass plate (highlighted by a blue box)?\n(A) tableware\n(B) glass plate" }, { "from": "gpt", "value": "(B) glass plate" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430677_326554070485875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, table (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261358_25915530646208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, picture frame (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) picture frame\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444892_104057897243500_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895910_110950540392083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, furniture (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) furniture\n(B) furniture" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458366_100826551332625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chest of drawers (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) chest of drawers\n(B) table lamp" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332158_260120624870000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, cabinetry (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) cabinetry\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334801_429250394462416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, vase (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) vase\n(B) houseplant" }, { "from": "gpt", "value": "(A) vase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898248_167815024539500_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the picture frame (highlighted by a red box)? curtain (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) curtain\n(B) picture frame" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898625_757758205081833_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from waste container (highlighted by a red box)? bottle (highlighted by a blue box) or toilet paper (highlighted by a green box)?\n(A) bottle\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458561_128021217722875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, cabinetry (highlighted by a red box) or doormat (highlighted by a blue box)?\n(A) cabinetry\n(B) doormat" }, { "from": "gpt", "value": "(B) doormat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445677_61052017230250_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the book (highlighted by a red box)? Choose among these: bean bag chair (highlighted by a blue box) or bookcase (highlighted by a green box).\n(A) bean bag chair\n(B) bookcase" }, { "from": "gpt", "value": "(B) bookcase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261228_13778707571083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to chair (highlighted by a red box)? Choose from bar stool (highlighted by a blue box) and chair (highlighted by a green box).\n(A) bar stool\n(B) chair" }, { "from": "gpt", "value": "(A) bar stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669851_12497861166041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the trash bin/can (highlighted by a red box)? glass door (highlighted by a blue box) or screen door (highlighted by a green box).\n(A) glass door\n(B) screen door" }, { "from": "gpt", "value": "(A) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333963_46788137886166_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332290_385261594572416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from light fixture (highlighted by a red box), chair (highlighted by a blue box) or window (highlighted by a green box)?\n(A) chair\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898959_821211706628166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the projection screen (highlighted by a red box)? Choose among these: microwave oven (highlighted by a blue box) or electric outlet (highlighted by a green box).\n(A) microwave oven\n(B) electric outlet" }, { "from": "gpt", "value": "(A) microwave oven" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445697_62741099016583_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, door handle (highlighted by a red box) or light switch (highlighted by a blue box)?\n(A) door handle\n(B) light switch" }, { "from": "gpt", "value": "(A) door handle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115143_87044472905041_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446493_356394654487708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, cabinetry (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) cabinetry\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739902_15024079638666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from chair (highlighted by a red box)? Choose from glass door (highlighted by a blue box) and table (highlighted by a green box).\n(A) glass door\n(B) table" }, { "from": "gpt", "value": "(A) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334189_354685358637166_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from appliance (highlighted by a red box), food (highlighted by a blue box) or electric outlet (highlighted by a green box)?\n(A) food\n(B) electric outlet" }, { "from": "gpt", "value": "(A) food" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896089_143902093756041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, doormat (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) doormat\n(B) screen door" }, { "from": "gpt", "value": "(A) doormat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018107_367920922823500_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from wall clock (highlighted by a red box)? houseplant (highlighted by a blue box) or curtain (highlighted by a green box)?\n(A) houseplant\n(B) curtain" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204325_14407307985500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of desk (annotated by the red box) in relation to boat?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649586_35295223859208_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895272_79494413931791_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from appliance (highlighted by a red box)? desk (highlighted by a blue box) or lamp (highlighted by a green box)?\n(A) desk\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331041_479825028121541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from chair (highlighted by a red box)? chair (highlighted by a blue box) or shelf (highlighted by a green box)?\n(A) chair\n(B) shelf" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261571_76479421664416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, flower (highlighted by a red box) or nightstand (highlighted by a blue box)?\n(A) flower\n(B) nightstand" }, { "from": "gpt", "value": "(B) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334892_623342554483166_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to mouthwash (highlighted by a red box)? Choose from cleaning product (highlighted by a blue box) and mouthwash (highlighted by a green box).\n(A) cleaning product\n(B) mouthwash" }, { "from": "gpt", "value": "(B) mouthwash" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334917_1090074366633707_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, cabinetry (highlighted by a red box) or oven (highlighted by a blue box)?\n(A) cabinetry\n(B) oven" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739611_200256543521250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, toilet paper (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) toilet paper\n(B) toilet paper" }, { "from": "gpt", "value": "(A) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333283_25399429480875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to chair (highlighted by a red box)? Select from desk (highlighted by a blue box) and mirror (highlighted by a green box).\n(A) desk\n(B) mirror" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662959_24585487399375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, light fixture (highlighted by a red box) or cabinet (highlighted by a blue box)?\n(A) light fixture\n(B) cabinet" }, { "from": "gpt", "value": "(A) light fixture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204474_25083570650333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, remote (highlighted by a red box) or remote (highlighted by a blue box)?\n(A) remote\n(B) remote" }, { "from": "gpt", "value": "(A) remote" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899198_186547782134791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from dresser (highlighted by a red box), appliance (highlighted by a blue box) or window screen (highlighted by a green box)?\n(A) appliance\n(B) window screen" }, { "from": "gpt", "value": "(B) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897709_111962298947750_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the cabinetry (highlighted by a red box)? floral arrangement (highlighted by a blue box) or sink (highlighted by a green box).\n(A) floral arrangement\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896170_140606626329958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, fireplace (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) fireplace\n(B) chair" }, { "from": "gpt", "value": "(A) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332467_886346768242000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, curtain (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) curtain\n(B) lamp" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458231_78560006155666_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to kitchen appliance (highlighted by a red box), kitchen appliance (highlighted by a blue box) or kitchen appliance (highlighted by a green box)?\n(A) kitchen appliance\n(B) kitchen appliance" }, { "from": "gpt", "value": "(B) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898189_145070428925791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from picture frame (highlighted by a red box)? Choose among these: door (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) door\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018804_18860893846541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from studio couch (highlighted by a red box)? Select from furniture (highlighted by a blue box) and cage (highlighted by a green box).\n(A) furniture\n(B) cage" }, { "from": "gpt", "value": "(B) cage" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670191_51477542649375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chest of drawers (highlighted by a red box) or mirror (highlighted by a blue box)?\n(A) chest of drawers\n(B) mirror" }, { "from": "gpt", "value": "(B) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332605_363332527839958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, dresser (highlighted by a red box) or bed (highlighted by a blue box)?\n(A) dresser\n(B) bed" }, { "from": "gpt", "value": "(B) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334947_664847286556208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, door (highlighted by a red box) or bicycle (highlighted by a blue box)?\n(A) door\n(B) bicycle" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446450_354647031251541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, toy (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649742_49581003474750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of table (annotated by the red box) in reference to game controller? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670186_51540933049708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chest of drawers (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) chest of drawers\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828565_102104678704875_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from lamp (highlighted by a red box)? screen door (highlighted by a blue box) or swivel chair (highlighted by a green box)?\n(A) screen door\n(B) swivel chair" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896162_139853578442791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from cleaning product (highlighted by a red box)? Choose from cleaning product (highlighted by a blue box) and cleaning product (highlighted by a green box).\n(A) cleaning product\n(B) cleaning product" }, { "from": "gpt", "value": "(B) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446025_134693306161249_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, baby carriage (highlighted by a red box) or cardboard box (highlighted by a blue box)?\n(A) baby carriage\n(B) cardboard box" }, { "from": "gpt", "value": "(A) baby carriage" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649798_46152504935333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the fireplace (highlighted by a red box)? Choose among these: wood burning stove (highlighted by a blue box) or table (highlighted by a green box).\n(A) wood burning stove\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670064_37865317560666_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, table (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) table\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115352_4065016561666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to swivel chair (highlighted by a red box), table (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) table\n(B) pillow" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446479_355640748338041_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204761_26622214202791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from picture frame (highlighted by a red box)? Choose among these: picture frame (highlighted by a blue box) or plant (highlighted by a green box).\n(A) picture frame\n(B) plant" }, { "from": "gpt", "value": "(B) plant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204481_24850679678958_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the picture frame (highlighted by a red box)? studio couch (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334934_663207601224750_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from mechanical fan (highlighted by a red box)? pillow (highlighted by a blue box) or lamp (highlighted by a green box)?\n(A) pillow\n(B) lamp" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649707_47661747443916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, cabinetry (highlighted by a red box) or paper towel (highlighted by a blue box)?\n(A) cabinetry\n(B) paper towel" }, { "from": "gpt", "value": "(B) paper towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333332_30023930954958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, washing machine (highlighted by a red box) or laundry (highlighted by a blue box)?\n(A) washing machine\n(B) laundry" }, { "from": "gpt", "value": "(A) washing machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331476_151106235575333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, bottle (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334566_68526727195707_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, computer monitor (highlighted by a red box) or computer screen (highlighted by a blue box)?\n(A) computer monitor\n(B) computer screen" }, { "from": "gpt", "value": "(A) computer monitor" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796562_15996474390916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, furniture (highlighted by a red box) or fireplace (highlighted by a blue box)?\n(A) furniture\n(B) fireplace" }, { "from": "gpt", "value": "(B) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897732_115031396866000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, nightstand (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) nightstand\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333275_24770501038750_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445169_7901232785541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the radiator (highlighted by a red box)? wall clock (highlighted by a blue box) or light fixture (highlighted by a green box).\n(A) wall clock\n(B) light fixture" }, { "from": "gpt", "value": "(B) light fixture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896560_30738118257166_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to shelf (highlighted by a red box)? Select from bed (highlighted by a blue box) and window (highlighted by a green box).\n(A) bed\n(B) window" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458637_128149477717666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, cardboard box (highlighted by a red box) or plastic bag (highlighted by a blue box)?\n(A) cardboard box\n(B) plastic bag" }, { "from": "gpt", "value": "(B) plastic bag" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446466_355456456875458_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204316_15875050975625_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333111_108663684385000_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896009_137196267157583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, picture frame (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) picture frame\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333331_29946928928125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from toiletry (highlighted by a red box)? Choose from cabinetry (highlighted by a blue box) and mouthwash (highlighted by a green box).\n(A) cabinetry\n(B) mouthwash" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899664_234604266828333_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from door (highlighted by a red box)? Choose from table lamp (highlighted by a blue box) and chandelier (highlighted by a green box).\n(A) table lamp\n(B) chandelier" }, { "from": "gpt", "value": "(B) chandelier" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47431034_141341261574458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhere is elevator (annotated by the red box) located in relation to door in the image?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898334_506677083682166_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from concrete (highlighted by a red box)? light switch (highlighted by a blue box) or electric outlet (highlighted by a green box)?\n(A) light switch\n(B) electric outlet" }, { "from": "gpt", "value": "(A) light switch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115445_11803040059208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of chest of drawers (annotated by the red box) and basket in the image provided, where is chest of drawers (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42923208_1908096935791_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898541_180950749036166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, computer monitor (highlighted by a red box) or computer monitor (highlighted by a blue box)?\n(A) computer monitor\n(B) computer monitor" }, { "from": "gpt", "value": "(B) computer monitor" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828435_90486641710583_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from ceramic tile (highlighted by a red box)? water heater (highlighted by a blue box) or screen door (highlighted by a green box)?\n(A) water heater\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458235_78481205476875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the appliance (highlighted by a red box)? Choose among these: cabinetry (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) cabinetry\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446492_356639054655958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, countertop (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) countertop\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662812_14675703580708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from clothing (highlighted by a red box)? Choose among these: hanger (highlighted by a blue box) or clothing (highlighted by a green box).\n(A) hanger\n(B) clothing" }, { "from": "gpt", "value": "(A) hanger" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333564_200621770724625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the bath mat (highlighted by a red box)? bathtub (highlighted by a blue box) or toilet bowl (highlighted by a green box).\n(A) bathtub\n(B) toilet bowl" }, { "from": "gpt", "value": "(B) toilet bowl" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899600_202642430093791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, curtain (highlighted by a red box) or concrete (highlighted by a blue box)?\n(A) curtain\n(B) concrete" }, { "from": "gpt", "value": "(B) concrete" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261562_75456968263125_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from cabinetry (highlighted by a red box)? cabinetry (highlighted by a blue box) or cabinetry (highlighted by a green box)?\n(A) cabinetry\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358645_3290231353500_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to door (highlighted by a red box)? tile (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) tile\n(B) picture frame" }, { "from": "gpt", "value": "(A) tile" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663051_36181361392125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chest of drawers (highlighted by a red box) or alarm clock (highlighted by a blue box)?\n(A) chest of drawers\n(B) alarm clock" }, { "from": "gpt", "value": "(B) alarm clock" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430067_34755282568541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, basket (highlighted by a red box) or cleaning product (highlighted by a blue box)?\n(A) basket\n(B) cleaning product" }, { "from": "gpt", "value": "(B) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261158_684912389208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, studio couch (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670318_64287140914375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, studio couch (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333599_75252776757583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from square (highlighted by a red box)? Choose from furniture (highlighted by a blue box) and mat (highlighted by a green box).\n(A) furniture\n(B) mat" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896358_18587409900083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from studio couch (highlighted by a red box)? chair (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) chair\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204726_23637922690833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, curtain (highlighted by a red box) or window (highlighted by a blue box)?\n(A) curtain\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333600_75341790617625_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261100_1149146202000_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to cabinetry (highlighted by a red box)? drawer (highlighted by a blue box) or home appliance (highlighted by a green box).\n(A) drawer\n(B) home appliance" }, { "from": "gpt", "value": "(B) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261541_74257330024791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chair (highlighted by a red box) or writing (highlighted by a blue box)?\n(A) chair\n(B) writing" }, { "from": "gpt", "value": "(B) writing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018107_367912926145625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, mirror (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) mirror\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332321_390726565423416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, countertop (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) countertop\n(B) electric outlet" }, { "from": "gpt", "value": "(A) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828437_90436045207083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from curtain (highlighted by a red box), window (highlighted by a blue box) or cabinetry (highlighted by a green box)?\n(A) window\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331008_181876484387041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, closet (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) closet\n(B) appliance" }, { "from": "gpt", "value": "(A) closet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444517_3733533531750_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, mouthwash (highlighted by a red box) or tap (highlighted by a blue box)?\n(A) mouthwash\n(B) tap" }, { "from": "gpt", "value": "(A) mouthwash" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898917_816780145973500_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to countertop (highlighted by a red box)? cabinetry (highlighted by a blue box) or appliance (highlighted by a green box).\n(A) cabinetry\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332992_125228485630500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, curtain (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) curtain\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332156_260013834790541_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is bookcase (annotated by the red box) located relative to chair? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332777_44526953229833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from table (highlighted by a red box)? Select from chair (highlighted by a blue box) and chair (highlighted by a green box).\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446574_86376071930625_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the chair (highlighted by a red box)? Choose among these: kitchen & dining room table (highlighted by a blue box) or houseplant (highlighted by a green box).\n(A) kitchen & dining room table\n(B) houseplant" }, { "from": "gpt", "value": "(A) kitchen & dining room table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898988_823906990954166_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to television (highlighted by a red box), lamp (highlighted by a blue box) or power outlet (highlighted by a green box)?\n(A) lamp\n(B) power outlet" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445670_60940713469625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the curtain (highlighted by a red box)? curtain (highlighted by a blue box) or studio couch (highlighted by a green box).\n(A) curtain\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331491_153090720068833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, desktop computer (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) desktop computer\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649692_36084261501875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, pillow (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) pillow\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358230_10026157475625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is vanity (annotated by the red box) located in relation to cupboard in the image? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204892_852374642458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, screen door (highlighted by a red box) or door (highlighted by a blue box)?\n(A) screen door\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261158_684912389208_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from door (highlighted by a red box), pillow (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739902_15040073320166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from chair (highlighted by a red box), screen door (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) screen door\n(B) chair" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333513_48704486017416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of screen door (annotated by the red box) in relation to shelf?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895448_129501087371291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of washing machine (annotated by the red box) and doormat in the image provided, where is washing machine (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899198_186529772929625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, chair (highlighted by a red box) or table (highlighted by a blue box)?\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430928_92929573466291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, door (highlighted by a red box) or counter top (highlighted by a blue box)?\n(A) door\n(B) counter top" }, { "from": "gpt", "value": "(B) counter top" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739331_45502716969166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, picture frame (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) picture frame\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430442_726451056416_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the chair (highlighted by a red box)? Choose among these: linen (highlighted by a blue box) or material (highlighted by a green box).\n(A) linen\n(B) material" }, { "from": "gpt", "value": "(A) linen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828272_84530783898791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chair (highlighted by a red box) or air conditioning (highlighted by a blue box)?\n(A) chair\n(B) air conditioning" }, { "from": "gpt", "value": "(B) air conditioning" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898701_580993993084125_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018003_458218924987458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chair (highlighted by a red box) or side table (highlighted by a blue box)?\n(A) chair\n(B) side table" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332810_48138332492166_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to food (highlighted by a red box)? Select from cabinetry (highlighted by a blue box) and food (highlighted by a green box).\n(A) cabinetry\n(B) food" }, { "from": "gpt", "value": "(B) food" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358406_40707381332166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, cabinetry (highlighted by a red box) or cardboard box (highlighted by a blue box)?\n(A) cabinetry\n(B) cardboard box" }, { "from": "gpt", "value": "(B) cardboard box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331618_17981374719041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from curtain (highlighted by a red box), appliance (highlighted by a blue box) or window (highlighted by a green box)?\n(A) appliance\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115177_104361242360458_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from sheet (highlighted by a red box)? Choose from infant bed (highlighted by a blue box) and changing table (highlighted by a green box).\n(A) infant bed\n(B) changing table" }, { "from": "gpt", "value": "(B) changing table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670269_66602813142000_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to door (highlighted by a red box), flower (highlighted by a blue box) or cabinetry (highlighted by a green box)?\n(A) flower\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331277_13096344206291_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from houseplant (highlighted by a red box)? Choose from fruit (highlighted by a blue box) and mixing bowl (highlighted by a green box).\n(A) fruit\n(B) mixing bowl" }, { "from": "gpt", "value": "(A) fruit" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446048_79981963948541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of screen door (annotated by the red box) in reference to window?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446444_82639015170625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from christmas tree (highlighted by a red box), furniture (highlighted by a blue box) or door (highlighted by a green box)?\n(A) furniture\n(B) door" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444891_104235991475625_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from cloth (highlighted by a red box)? furniture (highlighted by a blue box) or cloth (highlighted by a green box)?\n(A) furniture\n(B) cloth" }, { "from": "gpt", "value": "(B) cloth" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204726_23673924394958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, curtain (highlighted by a red box) or armchair (highlighted by a blue box)?\n(A) curtain\n(B) armchair" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898571_183815098693166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is window (annotated by the red box) located in relation to gift box in the image? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332316_390850665270250_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to shelf (highlighted by a red box)? Choose from shelf (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) shelf\n(B) picture frame" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332482_338672314787583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, furniture (highlighted by a red box) or baby carriage (highlighted by a blue box)?\n(A) furniture\n(B) baby carriage" }, { "from": "gpt", "value": "(B) baby carriage" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331279_14230086651208_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from mouthwash (highlighted by a red box), shelf (highlighted by a blue box) or towel (highlighted by a green box)?\n(A) shelf\n(B) towel" }, { "from": "gpt", "value": "(B) towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897462_469931660742458_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, furniture (highlighted by a red box) or cardboard box (highlighted by a blue box)?\n(A) furniture\n(B) cardboard box" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115363_1053359491623_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from studio couch (highlighted by a red box)? toy (highlighted by a blue box) or miniature (highlighted by a green box)?\n(A) toy\n(B) miniature" }, { "from": "gpt", "value": "(B) miniature" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896096_144114789018833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, chair (highlighted by a red box) or countertop (highlighted by a blue box)?\n(A) chair\n(B) countertop" }, { "from": "gpt", "value": "(B) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204341_15010908741541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from table (highlighted by a red box)? Select from lamp (highlighted by a blue box) and headboard (highlighted by a green box).\n(A) lamp\n(B) headboard" }, { "from": "gpt", "value": "(B) headboard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897954_533721635107291_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429728_19321330135291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to door (highlighted by a red box)? cabinetry (highlighted by a blue box) or door (highlighted by a green box).\n(A) cabinetry\n(B) door" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47431090_75922268722541_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331107_135506973655500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from appliance (highlighted by a red box)? Choose among these: basket (highlighted by a blue box) or letter (highlighted by a green box).\n(A) basket\n(B) letter" }, { "from": "gpt", "value": "(A) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662882_16559487737666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, coffee table (highlighted by a red box) or fireplace (highlighted by a blue box)?\n(A) coffee table\n(B) fireplace" }, { "from": "gpt", "value": "(B) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115575_2523612854125_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from table lamp (highlighted by a red box)? chest of drawers (highlighted by a blue box) or cardboard box (highlighted by a green box)?\n(A) chest of drawers\n(B) cardboard box" }, { "from": "gpt", "value": "(B) cardboard box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332295_385524104654500_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from furniture (highlighted by a red box), appliance (highlighted by a blue box) or equipment (highlighted by a green box)?\n(A) appliance\n(B) equipment" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458366_100770540147208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, table (highlighted by a red box) or table (highlighted by a blue box)?\n(A) table\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895446_129378787262666_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of washing machine (annotated by the red box) and clothing in the image provided, where is washing machine (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828272_84588793189916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chair (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) chair\n(B) pillow" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669927_14198959735791_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from drawer (highlighted by a red box)? table (highlighted by a blue box) or couch (highlighted by a green box)?\n(A) table\n(B) couch" }, { "from": "gpt", "value": "(B) couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334615_385661632156833_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358281_9161521092250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, kitchen appliance (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) kitchen appliance\n(B) electric outlet" }, { "from": "gpt", "value": "(A) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897643_146958178029000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, window (highlighted by a red box) or air conditioning (highlighted by a blue box)?\n(A) window\n(B) air conditioning" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663064_38448499155833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from cabinetry (highlighted by a red box)? cabinetry (highlighted by a blue box) or appliance (highlighted by a green box)?\n(A) cabinetry\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018751_7135252228916_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from table (highlighted by a red box)? houseplant (highlighted by a blue box) or radiator (highlighted by a green box)?\n(A) houseplant\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334912_1089946468137416_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445978_132448681523915_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from radiator (highlighted by a red box)? Select from nightstand (highlighted by a blue box) and table lamp (highlighted by a green box).\n(A) nightstand\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115126_84586937839000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, television (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) television\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898729_583560565759666_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332156_259993526353166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, shelf (highlighted by a red box) or cabinet (highlighted by a blue box)?\n(A) shelf\n(B) cabinet" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899653_233560471743791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from curtain (highlighted by a red box)? curtain (highlighted by a blue box) or mat (highlighted by a green box)?\n(A) curtain\n(B) mat" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796237_2994225036875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from basket (highlighted by a red box)? Select from radiator (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) radiator\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828439_90613941099958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, home appliance (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) home appliance\n(B) picture frame" }, { "from": "gpt", "value": "(A) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670291_62214221426666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from studio couch (highlighted by a red box)? Select from chair (highlighted by a blue box) and studio couch (highlighted by a green box).\n(A) chair\n(B) studio couch" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445677_61021813120166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, shower curtain (highlighted by a red box) or lantern (highlighted by a blue box)?\n(A) shower curtain\n(B) lantern" }, { "from": "gpt", "value": "(A) shower curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334040_278914206609041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, desk (highlighted by a red box) or armchair (highlighted by a blue box)?\n(A) desk\n(B) armchair" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430858_74473498052833_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from window (highlighted by a red box)? Choose among these: curtain (highlighted by a blue box) or houseplant (highlighted by a green box).\n(A) curtain\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828311_76568527862958_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the chair (highlighted by a red box)? bottle (highlighted by a blue box) or bottle (highlighted by a green box).\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115287_118102036706166_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739267_39992179182916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, door (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) door\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331128_174151450956333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from decor (highlighted by a red box)? Choose among these: picture frame (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204678_12478434415500_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from book (highlighted by a red box)? Choose from beige (highlighted by a blue box) and chair (highlighted by a green box).\n(A) beige\n(B) chair" }, { "from": "gpt", "value": "(A) beige" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430402_126564393952291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, gas stove (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) gas stove\n(B) bottle" }, { "from": "gpt", "value": "(A) gas stove" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670133_40019775963958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from radiator (highlighted by a red box)? Choose among these: chest of drawers (highlighted by a blue box) or chest of drawers (highlighted by a green box).\n(A) chest of drawers\n(B) chest of drawers" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018334_116227011140541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from cabinetry (highlighted by a red box)? Choose among these: appliance (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898007_219387634965041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, light switch (highlighted by a red box) or counter top (highlighted by a blue box)?\n(A) light switch\n(B) counter top" }, { "from": "gpt", "value": "(B) counter top" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358167_60835929188875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, studio couch (highlighted by a red box) or window screen (highlighted by a blue box)?\n(A) studio couch\n(B) window screen" }, { "from": "gpt", "value": "(B) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333847_74916632720791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from flower (highlighted by a red box), lamp (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) lamp\n(B) pillow" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261172_1502059975083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is chair (annotated by the red box) located relative to chair? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115384_1760577649666_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears farthest from the camera in this image?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895994_136227221234875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, picture frame (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) picture frame\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261710_1404228835458_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, radiator (highlighted by a red box) or sleeping bag (highlighted by a blue box)?\n(A) radiator\n(B) sleeping bag" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331904_627363575364750_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from furniture (highlighted by a red box)? clock (highlighted by a blue box) or door (highlighted by a green box)?\n(A) clock\n(B) door" }, { "from": "gpt", "value": "(A) clock" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896396_22562365338250_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to chest of drawers (highlighted by a red box)? pillow (highlighted by a blue box) or candle holder (highlighted by a green box).\n(A) pillow\n(B) candle holder" }, { "from": "gpt", "value": "(B) candle holder" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796466_3755805670083_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from toiletry (highlighted by a red box), mouthwash (highlighted by a blue box) or window sill (highlighted by a green box)?\n(A) mouthwash\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115415_4163560986290_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, oil lamp (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) oil lamp\n(B) chair" }, { "from": "gpt", "value": "(A) oil lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445997_133901463126833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from desk (highlighted by a red box)? Choose from radiator (highlighted by a blue box) and box (highlighted by a green box).\n(A) radiator\n(B) box" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796212_1519461243291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, dresser (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) dresser\n(B) lamp" }, { "from": "gpt", "value": "(A) dresser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663258_77862876980041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from ledge (highlighted by a red box)? mouthwash (highlighted by a blue box) or mouthwash (highlighted by a green box)?\n(A) mouthwash\n(B) mouthwash" }, { "from": "gpt", "value": "(A) mouthwash" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47431031_141307758457083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, toiletry (highlighted by a red box) or mouthwash (highlighted by a blue box)?\n(A) toiletry\n(B) mouthwash" }, { "from": "gpt", "value": "(A) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896229_5018500765541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, shelve (highlighted by a red box) or soap dispenser (highlighted by a blue box)?\n(A) shelve\n(B) soap dispenser" }, { "from": "gpt", "value": "(B) soap dispenser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115227_95880737009875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to pillow (highlighted by a red box)? window frame (highlighted by a blue box) or plant (highlighted by a green box).\n(A) window frame\n(B) plant" }, { "from": "gpt", "value": "(B) plant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828441_91462330318500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from chair (highlighted by a red box)? appliance (highlighted by a blue box) or cabinetry (highlighted by a green box)?\n(A) appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358253_6179052624583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to pad (highlighted by a red box)? box (highlighted by a blue box) or christmas tree (highlighted by a green box).\n(A) box\n(B) christmas tree" }, { "from": "gpt", "value": "(A) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115358_4171805542291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, houseplant (highlighted by a red box) or door (highlighted by a blue box)?\n(A) houseplant\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446588_206045151304916_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the fireplace (highlighted by a red box)? desk (highlighted by a blue box) or plug (highlighted by a green box).\n(A) desk\n(B) plug" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895972_406443157106000_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to shelf (highlighted by a red box)? Select from glass jar (highlighted by a blue box) and desk (highlighted by a green box).\n(A) glass jar\n(B) desk" }, { "from": "gpt", "value": "(A) glass jar" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261089_420160726041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from appliance (highlighted by a red box)? Select from shelf (highlighted by a blue box) and bottle (highlighted by a green box).\n(A) shelf\n(B) bottle" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897924_349013833847541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, sink (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) sink\n(B) appliance" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430765_339317458715625_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from book (highlighted by a red box)? book (highlighted by a blue box) or book (highlighted by a green box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358252_6113645164041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to swivel chair (highlighted by a red box)? table (highlighted by a blue box) or christmas tree (highlighted by a green box).\n(A) table\n(B) christmas tree" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334837_613741249034500_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739563_198370156638125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429723_17909850465875_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to countertop (highlighted by a red box)? Choose from kitchen appliance (highlighted by a blue box) and gas stove (highlighted by a green box).\n(A) kitchen appliance\n(B) gas stove" }, { "from": "gpt", "value": "(B) gas stove" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261407_29703607988958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of studio couch (annotated by the red box) in reference to pillow? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334935_663064892435333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the book (highlighted by a red box)? book (highlighted by a blue box) or toy (highlighted by a green box).\n(A) book\n(B) toy" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458572_256176076083_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to gas stove (highlighted by a red box)? Choose from kitchen appliance (highlighted by a blue box) and kitchen appliance (highlighted by a green box).\n(A) kitchen appliance\n(B) kitchen appliance" }, { "from": "gpt", "value": "(A) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899953_865627455851333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to toiletry (highlighted by a red box)? box (highlighted by a blue box) or crate (highlighted by a green box).\n(A) box\n(B) crate" }, { "from": "gpt", "value": "(B) crate" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828368_92197514114833_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899031_643138321629958_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445044_1578147412791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to pillow (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and studio couch (highlighted by a green box).\n(A) picture frame\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898802_68880392978708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from door (highlighted by a red box)? Select from plain (highlighted by a blue box) and window (highlighted by a green box).\n(A) plain\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444908_106420954406375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115217_94940733853916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, studio couch (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) studio couch\n(B) chair" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429851_12780745536666_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895469_132895924533250_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the chair (highlighted by a red box)? chair (highlighted by a blue box) or chair (highlighted by a green box).\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204920_3788890071500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, door (highlighted by a red box) or stairs (highlighted by a blue box)?\n(A) door\n(B) stairs" }, { "from": "gpt", "value": "(B) stairs" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430602_315152225998541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, vanity (highlighted by a red box) or glass box (highlighted by a blue box)?\n(A) vanity\n(B) glass box" }, { "from": "gpt", "value": "(A) vanity" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333493_62575486916583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from chest of drawers (highlighted by a red box), plant (highlighted by a blue box) or furniture (highlighted by a green box)?\n(A) plant\n(B) furniture" }, { "from": "gpt", "value": "(A) plant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429855_12698745511791_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to toilet (highlighted by a red box)? Choose from ceramic tile (highlighted by a blue box) and doormat (highlighted by a green box).\n(A) ceramic tile\n(B) doormat" }, { "from": "gpt", "value": "(A) ceramic tile" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204322_16034051719958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from curtain (highlighted by a red box)? Select from table (highlighted by a blue box) and houseplant (highlighted by a green box).\n(A) table\n(B) houseplant" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898586_184304186336083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, appliance (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) appliance\n(B) screen door" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896304_6856144464250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, chair (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) chair\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115216_95037226936500_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to chair (highlighted by a red box)? Choose from table (highlighted by a blue box) and door (highlighted by a green box).\n(A) table\n(B) door" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261344_24299546556250_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898052_223253123024708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from window (highlighted by a red box)? Select from radiator (highlighted by a blue box) and chest of drawers (highlighted by a green box).\n(A) radiator\n(B) chest of drawers" }, { "from": "gpt", "value": "(B) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897607_137247645817874_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhere is window (annotated by the red box) located in relation to plain in the image?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739814_15631651549416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to window (highlighted by a red box), window (highlighted by a blue box) or door (highlighted by a green box)?\n(A) window\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898261_696956238237958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, paperback book (highlighted by a red box) or home appliance (highlighted by a blue box)?\n(A) paperback book\n(B) home appliance" }, { "from": "gpt", "value": "(B) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895279_79265906875041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the cabinetry (highlighted by a red box)? Choose among these: table (highlighted by a blue box) or television (highlighted by a green box).\n(A) table\n(B) television" }, { "from": "gpt", "value": "(B) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115363_980271728166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, radiator (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) radiator\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895478_134525717497375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to toy (highlighted by a red box)? table (highlighted by a blue box) or window (highlighted by a green box).\n(A) table\n(B) window" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895863_107840162189916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, flower (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) flower\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739699_1603013005500_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the screen door (highlighted by a red box)? bidet (highlighted by a blue box) or soap dispenser (highlighted by a green box).\n(A) bidet\n(B) soap dispenser" }, { "from": "gpt", "value": "(A) bidet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331298_14996353272791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, cabinet (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) cabinet\n(B) pillow" }, { "from": "gpt", "value": "(A) cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445198_10961023646541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, entertainment center (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) entertainment center\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895919_112009502716958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, treadmill (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) treadmill\n(B) furniture" }, { "from": "gpt", "value": "(A) treadmill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333665_131845197232540_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from window (highlighted by a red box), toy (highlighted by a blue box) or houseplant (highlighted by a green box)?\n(A) toy\n(B) houseplant" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333863_75445847253541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from cabinetry (highlighted by a red box)? tap (highlighted by a blue box) or sink (highlighted by a green box)?\n(A) tap\n(B) sink" }, { "from": "gpt", "value": "(A) tap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334178_350714667999000_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331615_18069972119250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, desk (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) desk\n(B) bottle" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739301_43637260218250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, countertop (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) countertop\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115575_2537607059458_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, door (highlighted by a red box) or door (highlighted by a blue box)?\n(A) door\n(B) door" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828565_102122671565250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, window (highlighted by a red box) or television (highlighted by a blue box)?\n(A) window\n(B) television" }, { "from": "gpt", "value": "(B) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445723_59185766934291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, home appliance (highlighted by a red box) or tile (highlighted by a blue box)?\n(A) home appliance\n(B) tile" }, { "from": "gpt", "value": "(A) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018804_18864892229958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, toy (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261087_368865268916_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to food (highlighted by a red box)? Select from shelf (highlighted by a blue box) and tableware (highlighted by a green box).\n(A) shelf\n(B) tableware" }, { "from": "gpt", "value": "(B) tableware" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429870_14280573913916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, shelf (highlighted by a red box) or flag (highlighted by a blue box)?\n(A) shelf\n(B) flag" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333281_25582121500958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, floral arrangement (highlighted by a red box) or nightstand (highlighted by a blue box)?\n(A) floral arrangement\n(B) nightstand" }, { "from": "gpt", "value": "(A) floral arrangement" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018746_7226765048375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of table (annotated by the red box) in reference to houseplant?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331910_627569875702416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of pillow (annotated by the red box) in relation to material? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670288_62139217753875_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to couch (highlighted by a red box)? table lamp (highlighted by a blue box) or nightstand (highlighted by a green box).\n(A) table lamp\n(B) nightstand" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896063_132140997673583_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to table (highlighted by a red box), appliance (highlighted by a blue box) or appliance (highlighted by a green box)?\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018537_828115640678541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, picture frame (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) picture frame\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331606_18435997764791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from toiletry (highlighted by a red box)? Choose among these: bottle (highlighted by a blue box) or toiletry (highlighted by a green box).\n(A) bottle\n(B) toiletry" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333110_108798379754041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the radiator (highlighted by a red box)? Choose among these: appliance (highlighted by a blue box) or home appliance (highlighted by a green box).\n(A) appliance\n(B) home appliance" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333612_76194442162166_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334834_613856752229583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, bed (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) bed\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429851_12776747160750_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430212_688703354946583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is gadget (annotated by the red box) located relative to houseplant? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739315_44723916694583_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, animal (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) animal\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331686_6578304903083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to window (highlighted by a red box), door (highlighted by a blue box) or armchair (highlighted by a green box)?\n(A) door\n(B) armchair" }, { "from": "gpt", "value": "(B) armchair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663349_91010809962625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, cabinetry (highlighted by a red box) or concrete (highlighted by a blue box)?\n(A) cabinetry\n(B) concrete" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796514_3265214794458_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from screen door (highlighted by a red box)? Select from table lamp (highlighted by a blue box) and table lamp (highlighted by a green box).\n(A) table lamp\n(B) table lamp" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670124_41658482375750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, window (highlighted by a red box) or coffee cup (highlighted by a blue box)?\n(A) window\n(B) coffee cup" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261544_75107264856541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, cleaning product (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) cleaning product\n(B) toilet paper" }, { "from": "gpt", "value": "(A) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204506_676458316291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, appliance (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739948_17273417169958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from oven (highlighted by a red box)? Choose among these: cabinetry (highlighted by a blue box) or oven (highlighted by a green box).\n(A) cabinetry\n(B) oven" }, { "from": "gpt", "value": "(B) oven" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358241_10554717165416_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from screen door (highlighted by a red box), cleaning product (highlighted by a blue box) or bathtub (highlighted by a green box)?\n(A) cleaning product\n(B) bathtub" }, { "from": "gpt", "value": "(B) bathtub" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739699_1591001091541_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the counter top (highlighted by a red box)? Choose among these: bathtub (highlighted by a blue box) or screen door (highlighted by a green box).\n(A) bathtub\n(B) screen door" }, { "from": "gpt", "value": "(A) bathtub" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896096_144190790834125_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to screen door (highlighted by a red box)? Choose from computer keyboard (highlighted by a blue box) and mousepad (highlighted by a green box).\n(A) computer keyboard\n(B) mousepad" }, { "from": "gpt", "value": "(B) mousepad" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739595_199676683097208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, chest of drawers (highlighted by a red box) or armchair (highlighted by a blue box)?\n(A) chest of drawers\n(B) armchair" }, { "from": "gpt", "value": "(B) armchair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018552_830324332538041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from nightstand (highlighted by a red box)? pillow (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333310_28220646012833_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from counter (highlighted by a red box)? Choose among these: appliance (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) appliance\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204329_14361609387208_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to table (highlighted by a red box), fireplace (highlighted by a blue box) or houseplant (highlighted by a green box)?\n(A) fireplace\n(B) houseplant" }, { "from": "gpt", "value": "(A) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670174_42271410334083_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from chair (highlighted by a red box)? Choose among these: cabinetry (highlighted by a blue box) or table (highlighted by a green box).\n(A) cabinetry\n(B) table" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331920_630846291184458_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, cardboard box (highlighted by a red box) or laundry (highlighted by a blue box)?\n(A) cardboard box\n(B) laundry" }, { "from": "gpt", "value": "(A) cardboard box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895635_471919700815791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chair (highlighted by a red box) or table (highlighted by a blue box)?\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897971_216929462062125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is screen door (annotated by the red box) located in relation to waste container in the image? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796744_28846077564375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, picture frame (highlighted by a red box) or window (highlighted by a blue box)?\n(A) picture frame\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204304_15100173496583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to studio couch (highlighted by a red box)? Select from pillow (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895829_1221681815739000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to storage box (highlighted by a red box), skateboard (highlighted by a blue box) or screen door (highlighted by a green box)?\n(A) skateboard\n(B) screen door" }, { "from": "gpt", "value": "(A) skateboard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898348_509441012578375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, toilet paper (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) toilet paper\n(B) picture frame" }, { "from": "gpt", "value": "(A) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445691_57461382720750_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the storage box (highlighted by a red box)? Choose among these: cardboard box (highlighted by a blue box) or clothing (highlighted by a green box).\n(A) cardboard box\n(B) clothing" }, { "from": "gpt", "value": "(B) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261158_640913157958_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from curtain (highlighted by a red box)? Choose among these: picture frame (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899955_865598851035458_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from footwear (highlighted by a red box)? Select from dirt (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) dirt\n(B) cabinetry" }, { "from": "gpt", "value": "(A) dirt" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204291_14496098209000_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from toaster (highlighted by a red box), home appliance (highlighted by a blue box) or infant bed (highlighted by a green box)?\n(A) home appliance\n(B) infant bed" }, { "from": "gpt", "value": "(A) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444696_72512771494291_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261555_75437176452916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, door (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) door\n(B) radiator" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796438_688614753250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chest of drawers (highlighted by a red box) or television (highlighted by a blue box)?\n(A) chest of drawers\n(B) television" }, { "from": "gpt", "value": "(B) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358386_19162743137083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from desk (highlighted by a red box)? Select from houseplant (highlighted by a blue box) and chair (highlighted by a green box).\n(A) houseplant\n(B) chair" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333994_50490773124125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, shaving cream (highlighted by a red box) or cabinet (highlighted by a blue box)?\n(A) shaving cream\n(B) cabinet" }, { "from": "gpt", "value": "(A) shaving cream" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204656_10841668880750_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to appliance (highlighted by a red box), crock pot (highlighted by a blue box) or shelf (highlighted by a green box)?\n(A) crock pot\n(B) shelf" }, { "from": "gpt", "value": "(A) crock pot" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445040_1813036236833_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from couple (highlighted by a red box)? Choose among these: magazine (highlighted by a blue box) or drawer (highlighted by a green box).\n(A) magazine\n(B) drawer" }, { "from": "gpt", "value": "(A) magazine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445612_56472010231250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, chair (highlighted by a red box) or desk (highlighted by a blue box)?\n(A) chair\n(B) desk" }, { "from": "gpt", "value": "(B) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445695_57390278600083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, backpack (highlighted by a red box) or box (highlighted by a blue box)?\n(A) backpack\n(B) box" }, { "from": "gpt", "value": "(A) backpack" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358243_10427120043416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from toiletry (highlighted by a red box), sink (highlighted by a blue box) or basket (highlighted by a green box)?\n(A) sink\n(B) basket" }, { "from": "gpt", "value": "(B) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332201_264286274884541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, refrigerator (highlighted by a red box) or grocery bag (highlighted by a blue box)?\n(A) refrigerator\n(B) grocery bag" }, { "from": "gpt", "value": "(B) grocery bag" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663368_92551499179875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, radiator (highlighted by a red box) or blind (highlighted by a blue box)?\n(A) radiator\n(B) blind" }, { "from": "gpt", "value": "(B) blind" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429804_737633824680125_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from plant (highlighted by a red box)? wine rack (highlighted by a blue box) or wine rack (highlighted by a green box)?\n(A) wine rack\n(B) wine rack" }, { "from": "gpt", "value": "(A) wine rack" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739267_39982183318625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to door (highlighted by a red box)? Select from window (highlighted by a blue box) and barn door (highlighted by a green box).\n(A) window\n(B) barn door" }, { "from": "gpt", "value": "(B) barn door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334052_85568540439666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from beach towel (highlighted by a red box)? microwave oven (highlighted by a blue box) or beach towel (highlighted by a green box)?\n(A) microwave oven\n(B) beach towel" }, { "from": "gpt", "value": "(A) microwave oven" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333806_51265946961958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to book (highlighted by a red box), shower curtain (highlighted by a blue box) or book (highlighted by a green box)?\n(A) shower curtain\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899118_129882276489541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, table (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670150_40455636640541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from dresser (highlighted by a red box), vase (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) vase\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649720_48006953992125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, gas stove (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) gas stove\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446450_354787023914416_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from book (highlighted by a red box)? Choose from book (highlighted by a blue box) and book (highlighted by a green box).\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358362_16228163697708_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the furniture (highlighted by a red box)? Choose among these: book (highlighted by a blue box) or curtain (highlighted by a green box).\n(A) book\n(B) curtain" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445168_7918525884500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, light fixture (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) light fixture\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204800_24097127214291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of door (annotated by the red box) in relation to door?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333778_48311741307125_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261331_24066934857666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, toilet (highlighted by a red box) or concrete (highlighted by a blue box)?\n(A) toilet\n(B) concrete" }, { "from": "gpt", "value": "(B) concrete" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334914_1090119864955000_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260890_8710207310958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from mirror (highlighted by a red box)? bath (highlighted by a blue box) or toiletry (highlighted by a green box)?\n(A) bath\n(B) toiletry" }, { "from": "gpt", "value": "(A) bath" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332599_362944524514458_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is door (annotated by the red box) located relative to plain? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796366_10554444756666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of shelf (annotated by the red box) in relation to picnic basket?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358693_3112714779083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from door (highlighted by a red box)? Select from mirror (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) mirror\n(B) picture frame" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458690_135410791086874_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to chair (highlighted by a red box)? Select from chair (highlighted by a blue box) and table (highlighted by a green box).\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895994_136225205404875_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from pillow (highlighted by a red box), pillow (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739574_198410257454416_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to desk (highlighted by a red box)? picture frame (highlighted by a blue box) or handbag (highlighted by a green box).\n(A) picture frame\n(B) handbag" }, { "from": "gpt", "value": "(B) handbag" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430310_264936240793708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the studio couch (highlighted by a red box)? Choose among these: radiator (highlighted by a blue box) or chair (highlighted by a green box).\n(A) radiator\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662891_19485502951583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, ball (highlighted by a red box) or projection screen (highlighted by a blue box)?\n(A) ball\n(B) projection screen" }, { "from": "gpt", "value": "(B) projection screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444768_81538774175375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhere is bed (annotated by the red box) located in relation to electric outlet in the image?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897634_139597955519791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, mirror (highlighted by a red box) or bed (highlighted by a blue box)?\n(A) mirror\n(B) bed" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670232_52833379067583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, soap dispenser (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) soap dispenser\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446048_79985962285208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, teddy bear (highlighted by a red box) or door (highlighted by a blue box)?\n(A) teddy bear\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895896_109592422522875_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from shower (highlighted by a red box)? mirror (highlighted by a blue box) or houseplant (highlighted by a green box)?\n(A) mirror\n(B) houseplant" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739344_46030720838166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to door (highlighted by a red box)? chest of drawers (highlighted by a blue box) or furniture (highlighted by a green box).\n(A) chest of drawers\n(B) furniture" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899002_640942824318583_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669851_12491846990000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the door (highlighted by a red box)? Choose among these: elevator (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) elevator\n(B) picture frame" }, { "from": "gpt", "value": "(A) elevator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332201_264260268753916_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to couch (highlighted by a red box)? Select from shelf (highlighted by a blue box) and couch (highlighted by a green box).\n(A) shelf\n(B) couch" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333104_108748083505125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, cabinetry (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) cabinetry\n(B) bottle" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796520_4061805694291_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897822_132898286271041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of pillow (annotated by the red box) and pillow in the image provided, where is pillow (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333275_24888502494208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, person (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) person\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896031_129139830489583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from book (highlighted by a red box), door (highlighted by a blue box) or coffee table (highlighted by a green box)?\n(A) door\n(B) coffee table" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332473_886536175222583_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204857_1579626037083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to light fixture (highlighted by a red box)? Select from mirror (highlighted by a blue box) and light fixture (highlighted by a green box).\n(A) mirror\n(B) light fixture" }, { "from": "gpt", "value": "(B) light fixture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458260_74295047684083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from cardboard box (highlighted by a red box)? box (highlighted by a blue box) or storage box (highlighted by a green box)?\n(A) box\n(B) storage box" }, { "from": "gpt", "value": "(A) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018844_649845309485208_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from shelf (highlighted by a red box), bottle (highlighted by a blue box) or bottle (highlighted by a green box)?\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333055_60250989823125_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204724_23550525638666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the cabinetry (highlighted by a red box)? Choose among these: door (highlighted by a blue box) or refrigerator (highlighted by a green box).\n(A) door\n(B) refrigerator" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898621_758030309667916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is lighting (annotated by the red box) located relative to mirror? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895826_1219987677093208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, drawer (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) drawer\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896461_21767693928875_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from toilet (highlighted by a red box)? shower (highlighted by a blue box) or window (highlighted by a green box)?\n(A) shower\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649426_10833416093291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, countertop (highlighted by a red box) or chocolate cake (highlighted by a blue box)?\n(A) countertop\n(B) chocolate cake" }, { "from": "gpt", "value": "(A) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739899_14892981456958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, washing machine (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) washing machine\n(B) cabinetry" }, { "from": "gpt", "value": "(A) washing machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204329_14353612547750_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from clothing (highlighted by a red box)? Choose among these: clothing (highlighted by a blue box) or lamp (highlighted by a green box).\n(A) clothing\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430599_315414318276250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, fireplace (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) fireplace\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895298_91033130226375_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the television (highlighted by a red box)? table (highlighted by a blue box) or desk (highlighted by a green box).\n(A) table\n(B) desk" }, { "from": "gpt", "value": "(B) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669901_12087922366625_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to studio couch (highlighted by a red box), pillow (highlighted by a blue box) or throw pillow (highlighted by a green box)?\n(A) pillow\n(B) throw pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47431151_350872169044958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, dresser (highlighted by a red box) or stationery (highlighted by a blue box)?\n(A) dresser\n(B) stationery" }, { "from": "gpt", "value": "(B) stationery" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828366_92080429287875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, studio couch (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) studio couch\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649634_39395953904083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to window screen (highlighted by a red box)? Choose from studio couch (highlighted by a blue box) and window (highlighted by a green box).\n(A) studio couch\n(B) window" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649605_36429817261750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, door (highlighted by a red box) or door (highlighted by a blue box)?\n(A) door\n(B) door" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796464_3560603176583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, toilet (highlighted by a red box) or window screen (highlighted by a blue box)?\n(A) toilet\n(B) window screen" }, { "from": "gpt", "value": "(A) toilet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018872_653496386878083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, chair (highlighted by a red box) or window (highlighted by a blue box)?\n(A) chair\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331518_190812177527583_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899821_254731846265291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, cabinetry (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) cabinetry\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669968_27649200619541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from faucet (highlighted by a red box)? Select from cabinetry (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) cabinetry\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204449_23028982165375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, window (highlighted by a red box) or blind (highlighted by a blue box)?\n(A) window\n(B) blind" }, { "from": "gpt", "value": "(B) blind" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47330995_176949691957916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, laptop (highlighted by a red box) or swivel chair (highlighted by a blue box)?\n(A) laptop\n(B) swivel chair" }, { "from": "gpt", "value": "(A) laptop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649598_35826913688291_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to lamp (highlighted by a red box), pillow (highlighted by a blue box) or coffee cup (highlighted by a green box)?\n(A) pillow\n(B) coffee cup" }, { "from": "gpt", "value": "(B) coffee cup" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333812_52156463213000_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from mouse (highlighted by a red box)? computer monitor (highlighted by a blue box) or computer desk (highlighted by a green box)?\n(A) computer monitor\n(B) computer desk" }, { "from": "gpt", "value": "(A) computer monitor" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739689_1083034818541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to studio couch (highlighted by a red box), pillow (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898530_181122764321916_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445100_9184785732458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, pillow (highlighted by a red box) or footwear (highlighted by a blue box)?\n(A) pillow\n(B) footwear" }, { "from": "gpt", "value": "(B) footwear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897467_471619820500583_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the window screen (highlighted by a red box)? Choose among these: clock (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) clock\n(B) cabinetry" }, { "from": "gpt", "value": "(A) clock" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445639_58334782267166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896043_130101941430375_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from window blind (highlighted by a red box)? Select from radiator (highlighted by a blue box) and toilet (highlighted by a green box).\n(A) radiator\n(B) toilet" }, { "from": "gpt", "value": "(B) toilet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828272_84582779016333_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430314_264829050934207_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334938_663159287506875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from chair (highlighted by a red box)? houseplant (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) houseplant\n(B) chair" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018845_649718011242125_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the file cabinet (highlighted by a red box)? Choose among these: electric outlet (highlighted by a blue box) or light switch (highlighted by a green box).\n(A) electric outlet\n(B) light switch" }, { "from": "gpt", "value": "(A) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447203_88069087562916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, television (highlighted by a red box) or magazine (highlighted by a blue box)?\n(A) television\n(B) magazine" }, { "from": "gpt", "value": "(B) magazine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332316_390903077413083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the stool (highlighted by a red box)? platter (highlighted by a blue box) or stool (highlighted by a green box).\n(A) platter\n(B) stool" }, { "from": "gpt", "value": "(B) stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896096_144244785089208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, box (highlighted by a red box) or window frame (highlighted by a blue box)?\n(A) box\n(B) window frame" }, { "from": "gpt", "value": "(A) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899002_640854127518875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of waste container (annotated by the red box) and footwear in the image provided, where is waste container (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429799_737725021255583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from shelf (highlighted by a red box), wine rack (highlighted by a blue box) or beer bottle (highlighted by a green box)?\n(A) wine rack\n(B) beer bottle" }, { "from": "gpt", "value": "(B) beer bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662875_14419369430875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, table (highlighted by a red box) or bed (highlighted by a blue box)?\n(A) table\n(B) bed" }, { "from": "gpt", "value": "(B) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897462_470090061896500_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from coffee table (highlighted by a red box)? Select from remote (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) remote\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261343_23992051487500_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the exhaust hood (highlighted by a red box)? Choose among these: kitchen appliance (highlighted by a blue box) or swivel chair (highlighted by a green box).\n(A) kitchen appliance\n(B) swivel chair" }, { "from": "gpt", "value": "(A) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430592_311073906201458_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to glass vase (highlighted by a red box)? radiator (highlighted by a blue box) or window sill (highlighted by a green box).\n(A) radiator\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446558_86706968164041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, footwear (highlighted by a red box) or door (highlighted by a blue box)?\n(A) footwear\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897948_351343917065625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the radiator (highlighted by a red box)? Choose among these: studio couch (highlighted by a blue box) or furniture (highlighted by a green box).\n(A) studio couch\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430092_28738177182958_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of toy (annotated by the red box) and toy in the image provided, where is toy (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828552_101530718134083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, appliance (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331680_6715399066416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, window (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) window\n(B) window sill" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430294_187531948221250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, screen door (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) screen door\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430776_338948941700291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from bathtub (highlighted by a red box)? Select from cleaning product (highlighted by a blue box) and cleaning product (highlighted by a green box).\n(A) cleaning product\n(B) cleaning product" }, { "from": "gpt", "value": "(A) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897859_529566160435500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, curtain (highlighted by a red box) or doormat (highlighted by a blue box)?\n(A) curtain\n(B) doormat" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895274_79080915176333_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from desk (highlighted by a red box)? Choose from book (highlighted by a blue box) and paperback book (highlighted by a green box).\n(A) book\n(B) paperback book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896404_16673220210832_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the beach towel (highlighted by a red box)? table (highlighted by a blue box) or window (highlighted by a green box).\n(A) table\n(B) window" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828369_92308918006875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, studio couch (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261313_22289834612250_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from bottle (highlighted by a red box)? Choose among these: studio couch (highlighted by a blue box) or vase (highlighted by a green box).\n(A) studio couch\n(B) vase" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358257_6846883993416_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899202_186836878706875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to chest of drawers (highlighted by a red box)? Choose from microwave oven (highlighted by a blue box) and vanity (highlighted by a green box).\n(A) microwave oven\n(B) vanity" }, { "from": "gpt", "value": "(A) microwave oven" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018296_800235608493125_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to sink (highlighted by a red box)? Choose from tap (highlighted by a blue box) and sink (highlighted by a green box).\n(A) tap\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444588_31769303461625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to art (highlighted by a red box)? Select from countertop (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) countertop\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204658_10721266495916_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from glass bowl (highlighted by a red box)? Select from window sill (highlighted by a blue box) and orange (highlighted by a green box).\n(A) window sill\n(B) orange" }, { "from": "gpt", "value": "(A) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115504_12330318977125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, door (highlighted by a red box) or window (highlighted by a blue box)?\n(A) door\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261392_27829572703083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, lamp (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) lamp\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430236_181773977121083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from bath towel (highlighted by a red box)? Choose among these: bath towel (highlighted by a blue box) or sink (highlighted by a green box).\n(A) bath towel\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445040_1799041871958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, appliance (highlighted by a red box) or frying pan (highlighted by a blue box)?\n(A) appliance\n(B) frying pan" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897735_115175686850708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to basket (highlighted by a red box)? Select from bath towel (highlighted by a blue box) and curtain (highlighted by a green box).\n(A) bath towel\n(B) curtain" }, { "from": "gpt", "value": "(A) bath towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898388_367910296655208_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the appliance (highlighted by a red box)? box (highlighted by a blue box) or suitcase (highlighted by a green box).\n(A) box\n(B) suitcase" }, { "from": "gpt", "value": "(A) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445081_5497025314000_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331216_281071048505291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, elevator (highlighted by a red box) or barn door (highlighted by a blue box)?\n(A) elevator\n(B) barn door" }, { "from": "gpt", "value": "(B) barn door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896133_147117418347958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from window (highlighted by a red box)? lamp (highlighted by a blue box) or droplight (highlighted by a green box)?\n(A) lamp\n(B) droplight" }, { "from": "gpt", "value": "(B) droplight" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896103_145346915012458_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from picture frame (highlighted by a red box)? Choose among these: pillow (highlighted by a blue box) or shelf (highlighted by a green box).\n(A) pillow\n(B) shelf" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739628_1857670146583_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, door (highlighted by a red box) or chest of drawers (highlighted by a blue box)?\n(A) door\n(B) chest of drawers" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895863_107878163093958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, speaker (highlighted by a red box) or plant (highlighted by a blue box)?\n(A) speaker\n(B) plant" }, { "from": "gpt", "value": "(B) plant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649688_36020453415583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the towel (highlighted by a red box)? door (highlighted by a blue box) or dress (highlighted by a green box).\n(A) door\n(B) dress" }, { "from": "gpt", "value": "(B) dress" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333115_114248952016125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, bottle (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444869_97896777233791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from christmas tree (highlighted by a red box)? Choose among these: window screen (highlighted by a blue box) or candle holder (highlighted by a green box).\n(A) window screen\n(B) candle holder" }, { "from": "gpt", "value": "(A) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332792_47332295147083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to appliance (highlighted by a red box), appliance (highlighted by a blue box) or chest of drawers (highlighted by a green box)?\n(A) appliance\n(B) chest of drawers" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896396_22592769425708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of rail (annotated by the red box) and curtain in the image provided, where is rail (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333043_59583451680583_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, appliance (highlighted by a red box) or cleaning product (highlighted by a blue box)?\n(A) appliance\n(B) cleaning product" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897939_351289206307333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, table (highlighted by a red box) or christmas decoration (highlighted by a blue box)?\n(A) table\n(B) christmas decoration" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899034_643204927454333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from dumbbell (highlighted by a red box), furniture (highlighted by a blue box) or throw pillow (highlighted by a green box)?\n(A) furniture\n(B) throw pillow" }, { "from": "gpt", "value": "(B) throw pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334515_64446265782333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, towel/napkin (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) towel/napkin\n(B) cabinetry" }, { "from": "gpt", "value": "(A) towel/napkin" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261294_16268830366250_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from book (highlighted by a red box)? shelf (highlighted by a blue box) or paperback book (highlighted by a green box)?\n(A) shelf\n(B) paperback book" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115573_2624104543875_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the chest of drawers (highlighted by a red box)? drawer (highlighted by a blue box) or swivel chair (highlighted by a green box).\n(A) drawer\n(B) swivel chair" }, { "from": "gpt", "value": "(A) drawer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895482_134649017312040_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the toy (highlighted by a red box)? toy (highlighted by a blue box) or toy (highlighted by a green box).\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333110_108775888884625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhere is shelf (annotated by the red box) located in relation to letter in the image?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458231_78604004557208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, cleaning product (highlighted by a red box) or fruit (highlighted by a blue box)?\n(A) cleaning product\n(B) fruit" }, { "from": "gpt", "value": "(B) fruit" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018328_116001901895541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of light (annotated by the red box) and exhaust hood in the image provided, where is light (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898984_824307493149291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, computer monitor (highlighted by a red box) or power outlet (highlighted by a blue box)?\n(A) computer monitor\n(B) power outlet" }, { "from": "gpt", "value": "(A) computer monitor" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898716_582151250377541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, sink (highlighted by a red box) or tap (highlighted by a blue box)?\n(A) sink\n(B) tap" }, { "from": "gpt", "value": "(B) tap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332467_886342769848833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, studio couch (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670311_64328841073083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, window sill (highlighted by a red box) or swivel chair (highlighted by a blue box)?\n(A) window sill\n(B) swivel chair" }, { "from": "gpt", "value": "(B) swivel chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334912_1089944468941291_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears farthest from the camera in this image?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430236_181836984845916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to tablecloth (highlighted by a red box)? ceramic tile (highlighted by a blue box) or basin (highlighted by a green box).\n(A) ceramic tile\n(B) basin" }, { "from": "gpt", "value": "(B) basin" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018825_647325368528916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from blanket (highlighted by a red box)? storage box (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) storage box\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669968_27683203202666_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the window (highlighted by a red box)? Choose among these: table (highlighted by a blue box) or door (highlighted by a green box).\n(A) table\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898510_160679694711708_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261672_2982251720416_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from bed (highlighted by a red box)? door (highlighted by a blue box) or door (highlighted by a green box)?\n(A) door\n(B) door" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896244_7678188411416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, shelf (highlighted by a red box) or cabinet (highlighted by a blue box)?\n(A) shelf\n(B) cabinet" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430100_29181957141583_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to tap (highlighted by a red box)? Choose from mouthwash (highlighted by a blue box) and mouthwash (highlighted by a green box).\n(A) mouthwash\n(B) mouthwash" }, { "from": "gpt", "value": "(A) mouthwash" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739821_16240190806000_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332320_390792772001541_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from curtain (highlighted by a red box)? glass plate (highlighted by a blue box) or glass plate (highlighted by a green box)?\n(A) glass plate\n(B) glass plate" }, { "from": "gpt", "value": "(B) glass plate" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895904_110637337146416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chair (highlighted by a red box) or tripod (highlighted by a blue box)?\n(A) chair\n(B) tripod" }, { "from": "gpt", "value": "(B) tripod" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898393_369438016866875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, door (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) door\n(B) cabinetry" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896215_4254941495125_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the curtain (highlighted by a red box)? Choose among these: bed (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) bed\n(B) pillow" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896199_142375141562000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, mirror (highlighted by a red box) or window frame (highlighted by a blue box)?\n(A) mirror\n(B) window frame" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446446_82512115377833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, wood burning stove (highlighted by a red box) or candle holder (highlighted by a blue box)?\n(A) wood burning stove\n(B) candle holder" }, { "from": "gpt", "value": "(A) wood burning stove" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334917_1090070268285166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, laundry (highlighted by a red box) or kitchen appliance (highlighted by a blue box)?\n(A) laundry\n(B) kitchen appliance" }, { "from": "gpt", "value": "(B) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649722_48899914785291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of door (annotated by the red box) in reference to radiator? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898256_696464040568791_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204656_10818378094041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to appliance (highlighted by a red box)? electric outlet (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) electric outlet\n(B) cabinetry" }, { "from": "gpt", "value": "(A) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331928_163317186727791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, table (highlighted by a red box) or sink (highlighted by a blue box)?\n(A) table\n(B) sink" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333674_134267755527041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to book (highlighted by a red box)? desk (highlighted by a blue box) or bed (highlighted by a green box).\n(A) desk\n(B) bed" }, { "from": "gpt", "value": "(B) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018634_635948670298541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, cabinetry (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) cabinetry\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430239_181580272271833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is curtain (annotated by the red box) located relative to towel? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332599_362905723528166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, home appliance (highlighted by a red box) or door (highlighted by a blue box)?\n(A) home appliance\n(B) door" }, { "from": "gpt", "value": "(A) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018149_372816795753208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, box (highlighted by a red box) or paperback book (highlighted by a blue box)?\n(A) box\n(B) paperback book" }, { "from": "gpt", "value": "(B) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739850_17229730364500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, studio couch (highlighted by a red box) or concrete (highlighted by a blue box)?\n(A) studio couch\n(B) concrete" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333493_62533687226750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, furniture (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) furniture\n(B) radiator" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663250_75086078508583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, paperback book (highlighted by a red box) or table (highlighted by a blue box)?\n(A) paperback book\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739329_45613720983875_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the dresser (highlighted by a red box)? clothing (highlighted by a blue box) or chest of drawers (highlighted by a green box).\n(A) clothing\n(B) chest of drawers" }, { "from": "gpt", "value": "(B) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447275_408673609982791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, shelf (highlighted by a red box) or clothing (highlighted by a blue box)?\n(A) shelf\n(B) clothing" }, { "from": "gpt", "value": "(B) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334912_1090024470070875_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from laundry (highlighted by a red box)? clothesline (highlighted by a blue box) or countertop (highlighted by a green box)?\n(A) clothesline\n(B) countertop" }, { "from": "gpt", "value": "(B) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334148_142835127290458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is pillow (annotated by the red box) located relative to clothing? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739850_17197726982249_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the wheel (highlighted by a red box)? Choose among these: plant (highlighted by a blue box) or animal (highlighted by a green box).\n(A) plant\n(B) animal" }, { "from": "gpt", "value": "(B) animal" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444875_99389640565875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to christmas tree (highlighted by a red box)? Select from window sill (highlighted by a blue box) and window screen (highlighted by a green box).\n(A) window sill\n(B) window screen" }, { "from": "gpt", "value": "(A) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115394_3270860680666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, picture frame (highlighted by a red box) or entertainment center (highlighted by a blue box)?\n(A) picture frame\n(B) entertainment center" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898587_184493777958958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018523_821405490714750_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the bed (highlighted by a red box)? nightstand (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) nightstand\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649603_36019600473208_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to television (highlighted by a red box)? equipment (highlighted by a blue box) or gadget (highlighted by a green box).\n(A) equipment\n(B) gadget" }, { "from": "gpt", "value": "(B) gadget" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334202_103330198024458_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from pillow (highlighted by a red box)? Choose among these: table (highlighted by a blue box) or studio couch (highlighted by a green box).\n(A) table\n(B) studio couch" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670201_53354609922083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, studio couch (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115238_97776868813625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, table (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446450_354645032070000_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from desk (highlighted by a red box)? shelf (highlighted by a blue box) or table (highlighted by a green box)?\n(A) shelf\n(B) table" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739641_2233858753291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to bath (highlighted by a red box)? Choose from toilet paper (highlighted by a blue box) and porcelain (highlighted by a green box).\n(A) toilet paper\n(B) porcelain" }, { "from": "gpt", "value": "(B) porcelain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649609_36562712108791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from desk (highlighted by a red box)? Choose from bed frame (highlighted by a blue box) and gadget (highlighted by a green box).\n(A) bed frame\n(B) gadget" }, { "from": "gpt", "value": "(A) bed frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897467_471409824556666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, extinguisher (highlighted by a red box) or waste container (highlighted by a blue box)?\n(A) extinguisher\n(B) waste container" }, { "from": "gpt", "value": "(B) waste container" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333875_76123478995250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, desk (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) desk\n(B) toiletry" }, { "from": "gpt", "value": "(B) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897422_104059220186833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from chair (highlighted by a red box), table lamp (highlighted by a blue box) or wall clock (highlighted by a green box)?\n(A) table lamp\n(B) wall clock" }, { "from": "gpt", "value": "(B) wall clock" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334139_142697932798833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from pillow (highlighted by a red box)? Choose from furniture (highlighted by a blue box) and book (highlighted by a green box).\n(A) furniture\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358728_6526320883458_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from window screen (highlighted by a red box)? picture frame (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333298_26644440327333_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204726_23663911890000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the extension cord (highlighted by a red box)? Choose among these: basket (highlighted by a blue box) or table (highlighted by a green box).\n(A) basket\n(B) table" }, { "from": "gpt", "value": "(A) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458260_74295047684083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, storage box (highlighted by a red box) or storage box (highlighted by a blue box)?\n(A) storage box\n(B) storage box" }, { "from": "gpt", "value": "(A) storage box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018900_655464882676833_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47431151_350848162233375_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444738_77964394930833_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to studio couch (highlighted by a red box)? curtain (highlighted by a blue box) or door (highlighted by a green box).\n(A) curtain\n(B) door" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663368_92558396451583_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, furniture (highlighted by a red box) or table (highlighted by a blue box)?\n(A) furniture\n(B) table" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018760_15041360366750_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, window (highlighted by a red box) or window (highlighted by a blue box)?\n(A) window\n(B) window" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333463_57290562938375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, balloon (highlighted by a red box) or balloon (highlighted by a blue box)?\n(A) balloon\n(B) balloon" }, { "from": "gpt", "value": "(B) balloon" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896550_30125291151041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from pillow (highlighted by a red box)? Choose among these: bed (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) bed\n(B) pillow" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897655_147155781527125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, table (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) table\n(B) appliance" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018828_647408967993833_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from furniture (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and glass door (highlighted by a green box).\n(A) picture frame\n(B) glass door" }, { "from": "gpt", "value": "(B) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358168_61176027982375_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334941_664725286326291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to door (highlighted by a red box)? garage door (highlighted by a blue box) or bicycle (highlighted by a green box).\n(A) garage door\n(B) bicycle" }, { "from": "gpt", "value": "(B) bicycle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444588_31763305891583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, electric outlet (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) electric outlet\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458202_74747065427791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the pillow (highlighted by a red box)? Choose among these: chair (highlighted by a blue box) or chair (highlighted by a green box).\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261455_35831442199083_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445997_133917456553833_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from toaster (highlighted by a red box)? Choose from appliance (highlighted by a blue box) and appliance (highlighted by a green box).\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895595_1161365184565791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to cabinetry (highlighted by a red box), plant (highlighted by a blue box) or curtain (highlighted by a green box)?\n(A) plant\n(B) curtain" }, { "from": "gpt", "value": "(A) plant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358380_18936849669791_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to curtain (highlighted by a red box)? Choose from chair (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) chair\n(B) pillow" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895186_37702268067916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332401_405989463625208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, blanket (highlighted by a red box) or table (highlighted by a blue box)?\n(A) blanket\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332990_125281297656416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670074_38614514530291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, window (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) window\n(B) furniture" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896256_8053433358833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, bathtub (highlighted by a red box) or garden hose (highlighted by a blue box)?\n(A) bathtub\n(B) garden hose" }, { "from": "gpt", "value": "(B) garden hose" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739850_17221717024916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from chest of drawers (highlighted by a red box)? Select from curtain (highlighted by a blue box) and table lamp (highlighted by a green box).\n(A) curtain\n(B) table lamp" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670063_37993514338166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, chair (highlighted by a red box) or remote control (highlighted by a blue box)?\n(A) chair\n(B) remote control" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429774_360085617196041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the lamp (highlighted by a red box)? Choose among these: furniture (highlighted by a blue box) or bed (highlighted by a green box).\n(A) furniture\n(B) bed" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663415_95824667873708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, desk (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) desk\n(B) picture frame" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334205_103952972584791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, shelf (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) shelf\n(B) houseplant" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334837_613731253078333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from cabinetry (highlighted by a red box)? Choose from shelf (highlighted by a blue box) and screen door (highlighted by a green box).\n(A) shelf\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331587_15989979963375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, knob (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) knob\n(B) toy" }, { "from": "gpt", "value": "(A) knob" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115166_88056275954583_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to cleaning product (highlighted by a red box), tap (highlighted by a blue box) or bidet (highlighted by a green box)?\n(A) tap\n(B) bidet" }, { "from": "gpt", "value": "(A) tap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261390_27739275072083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to bottle (highlighted by a red box), mirror (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) mirror\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115648_4791652855083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of flower (annotated by the red box) in relation to chair? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115199_94468742464208_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from pillow (highlighted by a red box)? Select from nightstand (highlighted by a blue box) and bed (highlighted by a green box).\n(A) nightstand\n(B) bed" }, { "from": "gpt", "value": "(A) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334471_102417950971583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, countertop (highlighted by a red box) or fruit (highlighted by a blue box)?\n(A) countertop\n(B) fruit" }, { "from": "gpt", "value": "(B) fruit" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895623_470765042929875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, washing machine (highlighted by a red box) or power plugs and sockets (highlighted by a blue box)?\n(A) washing machine\n(B) power plugs and sockets" }, { "from": "gpt", "value": "(A) washing machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115127_84774943368125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, cabinetry (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) cabinetry\n(B) pillow" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333277_24425809182375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from chair (highlighted by a red box)? Select from book (highlighted by a blue box) and side table (highlighted by a green box).\n(A) book\n(B) side table" }, { "from": "gpt", "value": "(B) side table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896490_31550335350791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, toilet paper (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) toilet paper\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332751_42637721041125_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from bottle (highlighted by a red box)? Select from paper towel (highlighted by a blue box) and kettle (highlighted by a green box).\n(A) paper towel\n(B) kettle" }, { "from": "gpt", "value": "(B) kettle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115227_95966834495750_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the remote (highlighted by a red box)? cardboard box (highlighted by a blue box) or remote (highlighted by a green box).\n(A) cardboard box\n(B) remote" }, { "from": "gpt", "value": "(B) remote" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896247_7613082136791_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the screen door (highlighted by a red box)? Choose among these: radiator (highlighted by a blue box) or curtain (highlighted by a green box).\n(A) radiator\n(B) curtain" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204303_15005579388041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the table (highlighted by a red box)? bowl (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) bowl\n(B) cabinetry" }, { "from": "gpt", "value": "(A) bowl" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358378_19066947842750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, picture frame (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) picture frame\n(B) curtain" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649714_47790644000125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, cabinetry (highlighted by a red box) or home appliance (highlighted by a blue box)?\n(A) cabinetry\n(B) home appliance" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895272_79414313214750_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, table (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018817_20109038874083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, washing machine (highlighted by a red box) or bath towel (highlighted by a blue box)?\n(A) washing machine\n(B) bath towel" }, { "from": "gpt", "value": "(A) washing machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261248_15202797077750_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796189_298634891208_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to table (highlighted by a red box)? Select from bed (highlighted by a blue box) and bottle (highlighted by a green box).\n(A) bed\n(B) bottle" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333863_75431852936791_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115376_1815289338875_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from crate (highlighted by a red box)? Select from chest of drawers (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) chest of drawers\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899198_186495787005333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, wall clock (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) wall clock\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458703_136718468642166_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from appliance (highlighted by a red box)? bottle (highlighted by a blue box) or faucet (highlighted by a green box)?\n(A) bottle\n(B) faucet" }, { "from": "gpt", "value": "(B) faucet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261357_25854221559375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, refrigerator (highlighted by a red box) or door (highlighted by a blue box)?\n(A) refrigerator\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331507_155062220262916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from curtain (highlighted by a red box)? window (highlighted by a blue box) or bed frame (highlighted by a green box)?\n(A) window\n(B) bed frame" }, { "from": "gpt", "value": "(B) bed frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429750_355500381370458_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the book (highlighted by a red box)? Choose among these: bookcase (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) bookcase\n(B) picture frame" }, { "from": "gpt", "value": "(A) bookcase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204828_28525625857833_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the cabinetry (highlighted by a red box)? Choose among these: couch (highlighted by a blue box) or chair (highlighted by a green box).\n(A) couch\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739825_16160590425916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, television (highlighted by a red box) or window (highlighted by a blue box)?\n(A) television\n(B) window" }, { "from": "gpt", "value": "(A) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261169_1303171938833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333803_51548848626041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from cabinetry (highlighted by a red box)? desk (highlighted by a blue box) or toy (highlighted by a green box)?\n(A) desk\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430294_187541960830250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chair (highlighted by a red box) or counter top (highlighted by a blue box)?\n(A) chair\n(B) counter top" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332401_406023366405291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from candle holder (highlighted by a red box)? Select from oval (highlighted by a blue box) and chair (highlighted by a green box).\n(A) oval\n(B) chair" }, { "from": "gpt", "value": "(A) oval" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445799_67025112969541_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897587_134935346973707_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from coffee machine (highlighted by a red box)? Choose from cabinetry (highlighted by a blue box) and appliance (highlighted by a green box).\n(A) cabinetry\n(B) appliance" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796684_30833146139458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, appliance (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) appliance\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260892_8801202831708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, bathtub (highlighted by a red box) or soap dispenser (highlighted by a blue box)?\n(A) bathtub\n(B) soap dispenser" }, { "from": "gpt", "value": "(B) soap dispenser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895824_1219934681756541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, table lamp (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) table lamp\n(B) studio couch" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898723_582892066080208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, curtain (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) curtain\n(B) window sill" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115416_4087757626875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from pillow (highlighted by a red box)? pillow (highlighted by a blue box) or cat bed (highlighted by a green box)?\n(A) pillow\n(B) cat bed" }, { "from": "gpt", "value": "(B) cat bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739313_44876003739125_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to animal (highlighted by a red box)? Select from fireplace (highlighted by a blue box) and fireplace (highlighted by a green box).\n(A) fireplace\n(B) fireplace" }, { "from": "gpt", "value": "(B) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444588_31755309130708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, coffee machine (highlighted by a red box) or oven (highlighted by a blue box)?\n(A) coffee machine\n(B) oven" }, { "from": "gpt", "value": "(A) coffee machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458262_74209148303666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the clothesline (highlighted by a red box)? Choose among these: clothing (highlighted by a blue box) or trousers (highlighted by a green box).\n(A) clothing\n(B) trousers" }, { "from": "gpt", "value": "(A) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669854_12623459112708_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, paperback book (highlighted by a red box) or paperback book (highlighted by a blue box)?\n(A) paperback book\n(B) paperback book" }, { "from": "gpt", "value": "(A) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332396_401332813017333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from cabinetry (highlighted by a red box)? home appliance (highlighted by a blue box) or cabinetry (highlighted by a green box)?\n(A) home appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(A) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334947_664789293555041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from pillow (highlighted by a red box)? pillow (highlighted by a blue box) or nightstand (highlighted by a green box)?\n(A) pillow\n(B) nightstand" }, { "from": "gpt", "value": "(B) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897681_148456999294375_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649714_47878657425125_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the cage (highlighted by a red box)? armchair (highlighted by a blue box) or chair (highlighted by a green box).\n(A) armchair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897713_111862407166333_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from fridge (highlighted by a red box)? armchair (highlighted by a blue box) or armchair (highlighted by a green box)?\n(A) armchair\n(B) armchair" }, { "from": "gpt", "value": "(A) armchair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333206_48222578482208_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from mouthwash (highlighted by a red box), toiletry (highlighted by a blue box) or toiletry (highlighted by a green box)?\n(A) toiletry\n(B) toiletry" }, { "from": "gpt", "value": "(A) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896482_23873608506208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is stool (annotated by the red box) located in relation to door in the image? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204524_1594475451208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, door (highlighted by a red box) or paper bag (highlighted by a blue box)?\n(A) door\n(B) paper bag" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670291_62356615065208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, computer monitor (highlighted by a red box) or candle holder (highlighted by a blue box)?\n(A) computer monitor\n(B) candle holder" }, { "from": "gpt", "value": "(B) candle holder" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332158_260225732342666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to screen door (highlighted by a red box), box (highlighted by a blue box) or box (highlighted by a green box)?\n(A) box\n(B) box" }, { "from": "gpt", "value": "(A) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430931_92911380873250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, human face (highlighted by a red box) or person (highlighted by a blue box)?\n(A) human face\n(B) person" }, { "from": "gpt", "value": "(B) person" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018846_649933706810416_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to gas stove (highlighted by a red box)? paper towel (highlighted by a blue box) or toaster (highlighted by a green box).\n(A) paper towel\n(B) toaster" }, { "from": "gpt", "value": "(B) toaster" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334624_385706530511208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, houseplant (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) houseplant\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261686_3761947956583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, pillow (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) pillow\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899209_186691372558750_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to glass door (highlighted by a red box), window screen (highlighted by a blue box) or table (highlighted by a green box)?\n(A) window screen\n(B) table" }, { "from": "gpt", "value": "(A) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898696_580890385815791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from table (highlighted by a red box)? remote (highlighted by a blue box) or remote (highlighted by a green box)?\n(A) remote\n(B) remote" }, { "from": "gpt", "value": "(B) remote" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899268_883886192670541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from bathtub (highlighted by a red box)? Select from bath towel (highlighted by a blue box) and towel bar (highlighted by a green box).\n(A) bath towel\n(B) towel bar" }, { "from": "gpt", "value": "(B) towel bar" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739595_199616690156666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, laundry basket (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) laundry basket\n(B) basket" }, { "from": "gpt", "value": "(B) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445599_285099827377416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, electric outlet (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) electric outlet\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739912_15718488209958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, stairwell (highlighted by a red box) or concrete (highlighted by a blue box)?\n(A) stairwell\n(B) concrete" }, { "from": "gpt", "value": "(B) concrete" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333056_60159093724625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to houseplant (highlighted by a red box)? houseplant (highlighted by a blue box) or table (highlighted by a green box).\n(A) houseplant\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899567_958831125781875_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to remote (highlighted by a red box)? Choose from nightstand (highlighted by a blue box) and remote (highlighted by a green box).\n(A) nightstand\n(B) remote" }, { "from": "gpt", "value": "(B) remote" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663347_91378098019291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, pillow (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) pillow\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445680_61994354846166_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from table (highlighted by a red box)? Select from picture frame (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) picture frame\n(B) pillow" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897478_112715143440000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, gadget (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) gadget\n(B) electric outlet" }, { "from": "gpt", "value": "(A) gadget" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899559_199462701351625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, sink (highlighted by a red box) or tile (highlighted by a blue box)?\n(A) sink\n(B) tile" }, { "from": "gpt", "value": "(B) tile" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332290_385263593763541_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, chair (highlighted by a red box) or counter top (highlighted by a blue box)?\n(A) chair\n(B) counter top" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899284_885302362469291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to counter top (highlighted by a red box)? screen door (highlighted by a blue box) or appliance (highlighted by a green box).\n(A) screen door\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429773_359973029706916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, picture frame (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) picture frame\n(B) houseplant" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828437_90416036529708_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260938_4936192303000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chair (highlighted by a red box) or window (highlighted by a blue box)?\n(A) chair\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331036_476089119787083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, plant (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) plant\n(B) basket" }, { "from": "gpt", "value": "(B) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331542_6948910226125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, postcard (highlighted by a red box) or stairs (highlighted by a blue box)?\n(A) postcard\n(B) stairs" }, { "from": "gpt", "value": "(A) postcard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896395_22785656280916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is chest of drawers (annotated by the red box) located relative to bedside lamp?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796324_16019283299541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, clothing (highlighted by a red box) or door (highlighted by a blue box)?\n(A) clothing\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662882_16749495892250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, dresser (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) dresser\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895912_111409944483541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, basket (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) basket\n(B) basket" }, { "from": "gpt", "value": "(A) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828476_100659055061208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, shelf (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) shelf\n(B) lamp" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662959_24585487399375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the window (highlighted by a red box)? Choose among these: cabinet (highlighted by a blue box) or light fixture (highlighted by a green box).\n(A) cabinet\n(B) light fixture" }, { "from": "gpt", "value": "(B) light fixture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204319_15911952363291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, person (highlighted by a red box) or sculpture (highlighted by a blue box)?\n(A) person\n(B) sculpture" }, { "from": "gpt", "value": "(A) person" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458688_9217492384875_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to coffee table (highlighted by a red box)? stool (highlighted by a blue box) or studio couch (highlighted by a green box).\n(A) stool\n(B) studio couch" }, { "from": "gpt", "value": "(A) stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331938_164758318342041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from desk (highlighted by a red box)? Choose among these: box (highlighted by a blue box) or box (highlighted by a green box).\n(A) box\n(B) box" }, { "from": "gpt", "value": "(A) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896396_22544356125708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, stairs (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) stairs\n(B) curtain" }, { "from": "gpt", "value": "(A) stairs" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204763_26805604509333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from computer mouse (highlighted by a red box)? Choose among these: screen door (highlighted by a blue box) or television (highlighted by a green box).\n(A) screen door\n(B) television" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261241_15093609024916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, desk (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) desk\n(B) table lamp" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898625_757832008075750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, door (highlighted by a red box) or mirror (highlighted by a blue box)?\n(A) door\n(B) mirror" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895910_110940244679166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, bay window (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) bay window\n(B) cabinetry" }, { "from": "gpt", "value": "(A) bay window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430294_187652449339833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796226_2566918360333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, nightstand (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) nightstand\n(B) window sill" }, { "from": "gpt", "value": "(A) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260951_6083893193375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to chair (highlighted by a red box), picture frame (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) picture frame\n(B) chair" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445173_8219922639083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, bay window (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) bay window\n(B) radiator" }, { "from": "gpt", "value": "(A) bay window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333666_131951104244624_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, toy (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018815_19984739119875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, material (highlighted by a red box) or bathtub (highlighted by a blue box)?\n(A) material\n(B) bathtub" }, { "from": "gpt", "value": "(B) bathtub" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828366_92020420871041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, chair (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) chair\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204747_25236691735208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, picture frame (highlighted by a red box) or desk (highlighted by a blue box)?\n(A) picture frame\n(B) desk" }, { "from": "gpt", "value": "(B) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898786_67362014647332_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the throw pillow (highlighted by a red box)? studio couch (highlighted by a blue box) or christmas tree (highlighted by a green box).\n(A) studio couch\n(B) christmas tree" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331093_134550009219375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, truck (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) truck\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261686_3823955572750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, window (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) window\n(B) studio couch" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444716_75617367790333_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896224_4928704913333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the bathtub (highlighted by a red box)? Choose among these: bath towel (highlighted by a blue box) or medicine cabinet (highlighted by a green box).\n(A) bath towel\n(B) medicine cabinet" }, { "from": "gpt", "value": "(A) bath towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261297_16351830894083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, material (highlighted by a red box) or laundry (highlighted by a blue box)?\n(A) material\n(B) laundry" }, { "from": "gpt", "value": "(B) laundry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444758_80905955114583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, door (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) door\n(B) lamp" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47431078_74770809122500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, candle holder (highlighted by a red box) or candle holder (highlighted by a blue box)?\n(A) candle holder\n(B) candle holder" }, { "from": "gpt", "value": "(B) candle holder" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828369_92318913870625_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from mat (highlighted by a red box)? Choose from concrete (highlighted by a blue box) and chair (highlighted by a green box).\n(A) concrete\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896404_16707523236833_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the speaker (highlighted by a red box)? window (highlighted by a blue box) or garbage (highlighted by a green box).\n(A) window\n(B) garbage" }, { "from": "gpt", "value": "(B) garbage" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458228_76787772599708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, button (highlighted by a red box) or button (highlighted by a blue box)?\n(A) button\n(B) button" }, { "from": "gpt", "value": "(B) button" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897467_471673814654041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is door (annotated by the red box) located in relation to plain in the image? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739359_186955492237458_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from window blind (highlighted by a red box)? window sill (highlighted by a blue box) or window (highlighted by a green box)?\n(A) window sill\n(B) window" }, { "from": "gpt", "value": "(A) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332591_362632078012208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, paper bag (highlighted by a red box) or step stool (highlighted by a blue box)?\n(A) paper bag\n(B) step stool" }, { "from": "gpt", "value": "(B) step stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261677_3049540525791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358407_40571670836166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, refrigerator (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) refrigerator\n(B) bottle" }, { "from": "gpt", "value": "(A) refrigerator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895626_470735038427625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, cleaning product (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) cleaning product\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332480_338765610301833_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895192_38461635502541_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663065_38347988903500_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204919_3644497217000_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the curtain (highlighted by a red box)? branch (highlighted by a blue box) or chair (highlighted by a green box).\n(A) branch\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796514_3249221120750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, screen door (highlighted by a red box) or window (highlighted by a blue box)?\n(A) screen door\n(B) window" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899899_1026839437681625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of curtain (annotated by the red box) and window in the image provided, where is curtain (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333625_76913561439916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458440_117482682231541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, book (highlighted by a red box) or cabinet (highlighted by a blue box)?\n(A) book\n(B) cabinet" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204786_27295567507458_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from swivel chair (highlighted by a red box)? Choose among these: book (highlighted by a blue box) or book (highlighted by a green box).\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333778_48257629915583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, luggage and bags (highlighted by a red box) or box (highlighted by a blue box)?\n(A) luggage and bags\n(B) box" }, { "from": "gpt", "value": "(B) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331154_181642708086250_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261601_52844902182750_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to pillow (highlighted by a red box)? Choose from pillow (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331273_12863156128958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, curtain (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) curtain\n(B) shelf" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429799_737888521914000_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from mat (highlighted by a red box)? Choose from chair (highlighted by a blue box) and table (highlighted by a green box).\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898242_695939911801875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is folding chair (annotated by the red box) located in relation to pillow in the image? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358428_41382672614666_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to sink (highlighted by a red box)? Select from soap (highlighted by a blue box) and brush (highlighted by a green box).\n(A) soap\n(B) brush" }, { "from": "gpt", "value": "(A) soap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334628_386176645336166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, screen door (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) screen door\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649681_35597825332041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, soap dispenser (highlighted by a red box) or soap dispenser (highlighted by a blue box)?\n(A) soap dispenser\n(B) soap dispenser" }, { "from": "gpt", "value": "(B) soap dispenser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899513_197637044677416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, light fixture (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) light fixture\n(B) cabinetry" }, { "from": "gpt", "value": "(A) light fixture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896042_130088046926416_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to towel bar (highlighted by a red box), bottle (highlighted by a blue box) or drawer (highlighted by a green box)?\n(A) bottle\n(B) drawer" }, { "from": "gpt", "value": "(B) drawer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895972_406414952035291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, bottle (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896256_8095432561166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chest of drawers (highlighted by a red box) or window (highlighted by a blue box)?\n(A) chest of drawers\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669896_11072598900708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, dish washer (highlighted by a red box) or doormat (highlighted by a blue box)?\n(A) dish washer\n(B) doormat" }, { "from": "gpt", "value": "(A) dish washer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204387_23184783136208_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the bookshelf (highlighted by a red box)? furniture (highlighted by a blue box) or home appliance (highlighted by a green box).\n(A) furniture\n(B) home appliance" }, { "from": "gpt", "value": "(B) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796745_28764076724791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, picture frame (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) picture frame\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358660_1055200563375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, lamp (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) lamp\n(B) picture frame" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898342_508353009358166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, furniture (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) furniture\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204506_650469066125_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to cabinetry (highlighted by a red box), appliance (highlighted by a blue box) or appliance (highlighted by a green box)?\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670340_66249893418291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332952_21931401574291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from cabinetry (highlighted by a red box)? lamp (highlighted by a blue box) or hood (highlighted by a green box)?\n(A) lamp\n(B) hood" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334652_389694643128333_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, cabinetry (highlighted by a red box) or slate (highlighted by a blue box)?\n(A) cabinetry\n(B) slate" }, { "from": "gpt", "value": "(B) slate" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739835_16834204819333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the sink (highlighted by a red box)? Choose among these: bath towel (highlighted by a blue box) or soap dispenser (highlighted by a green box).\n(A) bath towel\n(B) soap dispenser" }, { "from": "gpt", "value": "(B) soap dispenser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897643_146952180448958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to laundry (highlighted by a red box), chest of drawers (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) chest of drawers\n(B) chair" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333472_58514631365416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to material (highlighted by a red box)? Choose from chest of drawers (highlighted by a blue box) and shoe box (highlighted by a green box).\n(A) chest of drawers\n(B) shoe box" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429753_355352991142500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, picture frame (highlighted by a red box) or exhaust hood (highlighted by a blue box)?\n(A) picture frame\n(B) exhaust hood" }, { "from": "gpt", "value": "(B) exhaust hood" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334914_1090119864955000_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828340_78873427818458_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to glass door (highlighted by a red box)? Choose from radiator (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) radiator\n(B) picture frame" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896019_138350181972625_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446495_357663827845125_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to cabinetry (highlighted by a red box)? towel (highlighted by a blue box) or towel (highlighted by a green box).\n(A) towel\n(B) towel" }, { "from": "gpt", "value": "(B) towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332026_202851497620916_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the bottle (highlighted by a red box)? Choose among these: appliance (highlighted by a blue box) or countertop (highlighted by a green box).\n(A) appliance\n(B) countertop" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895201_40079244845666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to oven (highlighted by a red box)? Select from appliance (highlighted by a blue box) and kitchen appliance (highlighted by a green box).\n(A) appliance\n(B) kitchen appliance" }, { "from": "gpt", "value": "(B) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430950_96419347005666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to bottle (highlighted by a red box)? Choose from light switch (highlighted by a blue box) and bottle (highlighted by a green box).\n(A) light switch\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261344_24365537083791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, picture frame (highlighted by a red box) or plaque (highlighted by a blue box)?\n(A) picture frame\n(B) plaque" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018286_799401413784291_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from tile (highlighted by a red box)? Choose among these: appliance (highlighted by a blue box) or bottle (highlighted by a green box).\n(A) appliance\n(B) bottle" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261219_13602814089625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to swivel chair (highlighted by a red box), screen door (highlighted by a blue box) or window screen (highlighted by a green box)?\n(A) screen door\n(B) window screen" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429774_360080819151708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the plant (highlighted by a red box)? furniture (highlighted by a blue box) or bed (highlighted by a green box).\n(A) furniture\n(B) bed" }, { "from": "gpt", "value": "(B) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899111_128780968103000_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899640_231850088285125_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears farthest from the camera in this image?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430239_181574274691333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to mouthwash (highlighted by a red box), bottle (highlighted by a blue box) or shower curtain (highlighted by a green box)?\n(A) bottle\n(B) shower curtain" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828230_69776622647540_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from picture frame (highlighted by a red box), table (highlighted by a blue box) or cabinetry (highlighted by a green box)?\n(A) table\n(B) cabinetry" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739603_199575389821833_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from round table (highlighted by a red box)? grocery bag (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) grocery bag\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018119_368593021477625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from desk (highlighted by a red box), coffee cup (highlighted by a blue box) or dresser (highlighted by a green box)?\n(A) coffee cup\n(B) dresser" }, { "from": "gpt", "value": "(B) dresser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358253_6159043874041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to pillow (highlighted by a red box), pillow (highlighted by a blue box) or stripe (highlighted by a green box)?\n(A) pillow\n(B) stripe" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446561_86518462985833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, toy (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261164_721914401791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, table (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) table\n(B) basket" }, { "from": "gpt", "value": "(B) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663312_76620381018416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, mirror (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) mirror\n(B) screen door" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444514_3809135901541_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, soap (highlighted by a red box) or shaving cream (highlighted by a blue box)?\n(A) soap\n(B) shaving cream" }, { "from": "gpt", "value": "(A) soap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899498_197899552649250_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to cabinetry (highlighted by a red box)? chair (highlighted by a blue box) or kitchen & dining room table (highlighted by a green box).\n(A) chair\n(B) kitchen & dining room table" }, { "from": "gpt", "value": "(B) kitchen & dining room table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334733_535815432605291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, plant (highlighted by a red box) or paperback book (highlighted by a blue box)?\n(A) plant\n(B) paperback book" }, { "from": "gpt", "value": "(A) plant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430293_187348355863958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the dresser (highlighted by a red box)? Choose among these: table (highlighted by a blue box) or rocking chair (highlighted by a green box).\n(A) table\n(B) rocking chair" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898360_511719478762083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, Wii controller (highlighted by a red box) or control (highlighted by a blue box)?\n(A) Wii controller\n(B) control" }, { "from": "gpt", "value": "(A) Wii controller" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261413_29635401651208_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the lamp (highlighted by a red box)? printer (highlighted by a blue box) or file cabinet (highlighted by a green box).\n(A) printer\n(B) file cabinet" }, { "from": "gpt", "value": "(A) printer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260946_4711897700000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, pillar (highlighted by a red box) or stove (highlighted by a blue box)?\n(A) pillar\n(B) stove" }, { "from": "gpt", "value": "(B) stove" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261651_1381031756708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from pillow (highlighted by a red box)? Select from side table (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) side table\n(B) pillow" }, { "from": "gpt", "value": "(A) side table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458524_125806166029708_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, television (highlighted by a red box) or door (highlighted by a blue box)?\n(A) television\n(B) door" }, { "from": "gpt", "value": "(A) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899236_880490331906500_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, furniture (highlighted by a red box) or balloon (highlighted by a blue box)?\n(A) furniture\n(B) balloon" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796596_18021679285583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, cabinetry (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) cabinetry\n(B) cabinetry" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899663_234365461457958_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, bulletin board (highlighted by a red box) or stool (highlighted by a blue box)?\n(A) bulletin board\n(B) stool" }, { "from": "gpt", "value": "(A) bulletin board" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739916_15615395628000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, toy (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796751_29755663005750_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from furniture (highlighted by a red box)? furniture (highlighted by a blue box) or furniture (highlighted by a green box)?\n(A) furniture\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670133_40061875983791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, sink (highlighted by a red box) or step stool (highlighted by a blue box)?\n(A) sink\n(B) step stool" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429826_746703195803750_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to toilet (highlighted by a red box)? Choose from toilet paper (highlighted by a blue box) and toilet paper (highlighted by a green box).\n(A) toilet paper\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204392_22988081540541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to picture frame (highlighted by a red box)? Select from radiator (highlighted by a blue box) and chair (highlighted by a green box).\n(A) radiator\n(B) chair" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018404_393246890272333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, brush (highlighted by a red box) or cleaning product (highlighted by a blue box)?\n(A) brush\n(B) cleaning product" }, { "from": "gpt", "value": "(A) brush" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445902_68258593636416_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333657_130188071247000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, window (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) window\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333493_62599493816000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, houseplant (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) houseplant\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261275_14245156588041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, picture frame (highlighted by a red box) or window (highlighted by a blue box)?\n(A) picture frame\n(B) window" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446492_356641053837541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, microwave oven (highlighted by a red box) or rail (highlighted by a blue box)?\n(A) microwave oven\n(B) rail" }, { "from": "gpt", "value": "(B) rail" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260938_4856190633958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from table (highlighted by a red box)? Choose among these: table lamp (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) table lamp\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670350_67396590783208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, fireplace (highlighted by a red box) or window (highlighted by a blue box)?\n(A) fireplace\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261527_45668743812125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, door (highlighted by a red box) or bean bag chair (highlighted by a blue box)?\n(A) door\n(B) bean bag chair" }, { "from": "gpt", "value": "(B) bean bag chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261406_29726698852583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to shelf (highlighted by a red box), table lamp (highlighted by a blue box) or screen door (highlighted by a green box)?\n(A) table lamp\n(B) screen door" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444907_106150764927958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to home appliance (highlighted by a red box)? Select from cabinetry (highlighted by a blue box) and coffee machine (highlighted by a green box).\n(A) cabinetry\n(B) coffee machine" }, { "from": "gpt", "value": "(B) coffee machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896224_4904698228041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of bath towel (annotated by the red box) in relation to tap? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663377_92435694978583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, candle holder (highlighted by a red box) or floral arrangement (highlighted by a blue box)?\n(A) candle holder\n(B) floral arrangement" }, { "from": "gpt", "value": "(A) candle holder" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895587_1160176437482666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, table (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) table\n(B) pillow" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018420_395530511898916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of table (annotated by the red box) in reference to glass door? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899270_883829299400250_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from sink (highlighted by a red box)? light switch (highlighted by a blue box) or mirror (highlighted by a green box)?\n(A) light switch\n(B) mirror" }, { "from": "gpt", "value": "(A) light switch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47330995_176927284418916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, appliance (highlighted by a red box) or kitchen appliance (highlighted by a blue box)?\n(A) appliance\n(B) kitchen appliance" }, { "from": "gpt", "value": "(B) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331356_194723343638583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chest of drawers (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) chest of drawers\n(B) electric outlet" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429799_737777933252666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to pillow (highlighted by a red box)? Choose from table (highlighted by a blue box) and houseplant (highlighted by a green box).\n(A) table\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333018_130147209440833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, box (highlighted by a red box) or door (highlighted by a blue box)?\n(A) box\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331615_18099976610166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhere is window frame (annotated by the red box) located in relation to plain in the image?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899187_184374783707666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of bed (annotated by the red box) in reference to picture frame? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828311_76548535772833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from microwave oven (highlighted by a red box), home appliance (highlighted by a blue box) or bottle (highlighted by a green box)?\n(A) home appliance\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458690_135422786338875_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to magazine (highlighted by a red box)? Choose from window (highlighted by a blue box) and desk (highlighted by a green box).\n(A) window\n(B) desk" }, { "from": "gpt", "value": "(B) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334274_156999378164000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, shelf (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) shelf\n(B) shelf" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899184_184459981705416_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the mirror (highlighted by a red box)? Choose among these: mat (highlighted by a blue box) or trash bin/can (highlighted by a green box).\n(A) mat\n(B) trash bin/can" }, { "from": "gpt", "value": "(A) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663051_36165367715875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, window (highlighted by a red box) or sculpture (highlighted by a blue box)?\n(A) window\n(B) sculpture" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895910_110845434119625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to folding chair (highlighted by a red box)? Choose from pillow (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430449_1701039705666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to television (highlighted by a red box), table (highlighted by a blue box) or table lamp (highlighted by a green box)?\n(A) table\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115158_87693286790500_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of plywood (annotated by the red box) and lamp in the image provided, where is plywood (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445587_284688841030875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, door (highlighted by a red box) or tablet computer (highlighted by a blue box)?\n(A) door\n(B) tablet computer" }, { "from": "gpt", "value": "(B) tablet computer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458228_76765765041333_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, pillow (highlighted by a red box) or laundry basket (highlighted by a blue box)?\n(A) pillow\n(B) laundry basket" }, { "from": "gpt", "value": "(B) laundry basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331159_181771022763125_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from bottle (highlighted by a red box)? Choose among these: bottle (highlighted by a blue box) or bottle (highlighted by a green box).\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896251_8011933925291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from door (highlighted by a red box)? shower curtain (highlighted by a blue box) or door (highlighted by a green box)?\n(A) shower curtain\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334267_156732270508916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, chair (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) chair\n(B) curtain" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896404_16753321704916_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from appliance (highlighted by a red box)? Choose among these: toaster (highlighted by a blue box) or teapot (highlighted by a green box).\n(A) toaster\n(B) teapot" }, { "from": "gpt", "value": "(A) toaster" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649707_47747745139583_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the window (highlighted by a red box)? balcony (highlighted by a blue box) or chair (highlighted by a green box).\n(A) balcony\n(B) chair" }, { "from": "gpt", "value": "(A) balcony" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739641_2261847174166_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from radiator (highlighted by a red box)? Choose among these: bath towel (highlighted by a blue box) or chest of drawers (highlighted by a green box).\n(A) bath towel\n(B) chest of drawers" }, { "from": "gpt", "value": "(B) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332710_109926610967625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, kit (highlighted by a red box) or kit (highlighted by a blue box)?\n(A) kit\n(B) kit" }, { "from": "gpt", "value": "(A) kit" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332644_368004458914833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, door (highlighted by a red box) or hardwood (highlighted by a blue box)?\n(A) door\n(B) hardwood" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898551_181878178876541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333888_78852261581708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, curtain (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) curtain\n(B) pillow" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796598_18076290012791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261096_1246455899000_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to shelf (highlighted by a red box)? Select from book (highlighted by a blue box) and basket (highlighted by a green box).\n(A) book\n(B) basket" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331587_15981983193166_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from book (highlighted by a red box)? bird cage (highlighted by a blue box) or book (highlighted by a green box)?\n(A) bird cage\n(B) book" }, { "from": "gpt", "value": "(A) bird cage" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669927_14254970922166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the computer monitor (highlighted by a red box)? mat (highlighted by a blue box) or chair (highlighted by a green box).\n(A) mat\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334754_421185704261583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from houseplant (highlighted by a red box), window sill (highlighted by a blue box) or houseplant (highlighted by a green box)?\n(A) window sill\n(B) houseplant" }, { "from": "gpt", "value": "(A) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429826_746654798680208_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to toilet paper (highlighted by a red box)? Select from concrete (highlighted by a blue box) and toilet (highlighted by a green box).\n(A) concrete\n(B) toilet" }, { "from": "gpt", "value": "(B) toilet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446576_205915538249291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the table (highlighted by a red box)? houseplant (highlighted by a blue box) or remote (highlighted by a green box).\n(A) houseplant\n(B) remote" }, { "from": "gpt", "value": "(B) remote" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896196_142339638959458_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from pillow (highlighted by a red box)? Choose from pillow (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670350_67506580615916_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the window (highlighted by a red box)? glass vase (highlighted by a blue box) or window sill (highlighted by a green box).\n(A) glass vase\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898587_184543774841125_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to chair (highlighted by a red box)? chair (highlighted by a blue box) or round table (highlighted by a green box).\n(A) chair\n(B) round table" }, { "from": "gpt", "value": "(B) round table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444588_31765305081541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from tap (highlighted by a red box), cabinetry (highlighted by a blue box) or countertop (highlighted by a green box)?\n(A) cabinetry\n(B) countertop" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896169_140715516608915_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796498_1578069761708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the corridor (highlighted by a red box)? Choose among these: door handle (highlighted by a blue box) or door (highlighted by a green box).\n(A) door handle\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458337_102894726342416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, bean bag chair (highlighted by a red box) or baby (highlighted by a blue box)?\n(A) bean bag chair\n(B) baby" }, { "from": "gpt", "value": "(B) baby" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333635_123691709981291_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to bottle (highlighted by a red box)? countertop (highlighted by a blue box) or hand towel (highlighted by a green box).\n(A) countertop\n(B) hand towel" }, { "from": "gpt", "value": "(B) hand towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896160_139924083889541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, counter top (highlighted by a red box) or toothbrush (highlighted by a blue box)?\n(A) counter top\n(B) toothbrush" }, { "from": "gpt", "value": "(A) counter top" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895921_111976016596375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, poster page (highlighted by a red box) or weight (highlighted by a blue box)?\n(A) poster page\n(B) weight" }, { "from": "gpt", "value": "(A) poster page" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670063_37949515958833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to pillow (highlighted by a red box)? Select from cabinetry (highlighted by a blue box) and studio couch (highlighted by a green box).\n(A) cabinetry\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204505_874759424791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from banana (highlighted by a red box), bowl (highlighted by a blue box) or stool (highlighted by a green box)?\n(A) bowl\n(B) stool" }, { "from": "gpt", "value": "(B) stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261392_27819559996000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, studio couch (highlighted by a red box) or coffee table (highlighted by a blue box)?\n(A) studio couch\n(B) coffee table" }, { "from": "gpt", "value": "(B) coffee table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649742_49630999386250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, picture frame (highlighted by a red box) or couple (highlighted by a blue box)?\n(A) picture frame\n(B) couple" }, { "from": "gpt", "value": "(B) couple" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896304_6874137337666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, table (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) table\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896063_132133000843041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, sink (highlighted by a red box) or cabinet (highlighted by a blue box)?\n(A) sink\n(B) cabinet" }, { "from": "gpt", "value": "(B) cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895179_37968476940208_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from chest of drawers (highlighted by a red box)? desktop computer (highlighted by a blue box) or tight (highlighted by a green box)?\n(A) desktop computer\n(B) tight" }, { "from": "gpt", "value": "(B) tight" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669927_14248956633166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, laptop (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) laptop\n(B) chair" }, { "from": "gpt", "value": "(A) laptop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358700_5228664780125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, toilet paper (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) toilet paper\n(B) toilet paper" }, { "from": "gpt", "value": "(A) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447294_408942299146500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, chair (highlighted by a red box) or window (highlighted by a blue box)?\n(A) chair\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331711_11301309654541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, countertop (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) countertop\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018320_110231288424041_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from towel/napkin (highlighted by a red box)? Choose from drawer (highlighted by a blue box) and towel/napkin (highlighted by a green box).\n(A) drawer\n(B) towel/napkin" }, { "from": "gpt", "value": "(A) drawer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899002_640970213017041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, collage (highlighted by a red box) or window (highlighted by a blue box)?\n(A) collage\n(B) window" }, { "from": "gpt", "value": "(A) collage" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334171_350615458133208_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899653_233596474149916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, letter (highlighted by a red box) or letter (highlighted by a blue box)?\n(A) letter\n(B) letter" }, { "from": "gpt", "value": "(B) letter" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899905_1027866568861166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of door (annotated by the red box) in reference to clothing?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458602_125134755802250_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to screen door (highlighted by a red box)? chest of drawers (highlighted by a blue box) or mirror (highlighted by a green box).\n(A) chest of drawers\n(B) mirror" }, { "from": "gpt", "value": "(B) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115265_115091265083291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, power outlet (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) power outlet\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897512_472740506589875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, box (highlighted by a red box) or drawer (highlighted by a blue box)?\n(A) box\n(B) drawer" }, { "from": "gpt", "value": "(A) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446462_354250426656458_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from pillow (highlighted by a red box)? Choose among these: chair (highlighted by a blue box) or door (highlighted by a green box).\n(A) chair\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899034_643250625234583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, christmas tree (highlighted by a red box) or robe (highlighted by a blue box)?\n(A) christmas tree\n(B) robe" }, { "from": "gpt", "value": "(A) christmas tree" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018107_367882921914250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, table lamp (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) table lamp\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204362_15637125910333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, picture frame (highlighted by a red box) or shutter (highlighted by a blue box)?\n(A) picture frame\n(B) shutter" }, { "from": "gpt", "value": "(B) shutter" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204304_15060173425750_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from pillow (highlighted by a red box)? Select from chair (highlighted by a blue box) and table (highlighted by a green box).\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334660_390812588727791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, curtain (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) curtain\n(B) studio couch" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358105_61909883366250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, table (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663415_95950867892833_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from pillow (highlighted by a red box), pillow (highlighted by a blue box) or studio couch (highlighted by a green box)?\n(A) pillow\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828250_81617494194916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to electric outlet (highlighted by a red box)? door (highlighted by a blue box) or bath (highlighted by a green box).\n(A) door\n(B) bath" }, { "from": "gpt", "value": "(B) bath" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896491_31452142649541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, lamp (highlighted by a red box) or bath towel (highlighted by a blue box)?\n(A) lamp\n(B) bath towel" }, { "from": "gpt", "value": "(B) bath towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458700_135320793413707_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from magazine (highlighted by a red box)? Select from table (highlighted by a blue box) and drawer (highlighted by a green box).\n(A) table\n(B) drawer" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115222_95762735981041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, table lamp (highlighted by a red box) or wine bottle (highlighted by a blue box)?\n(A) table lamp\n(B) wine bottle" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445594_285292131361791_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662884_16521785989666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, cabinetry (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) cabinetry\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896231_6983717133500_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from studio couch (highlighted by a red box), pillow (highlighted by a blue box) or screen door (highlighted by a green box)?\n(A) pillow\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896308_6704637752541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the refrigerator (highlighted by a red box)? Choose among these: door (highlighted by a blue box) or tile (highlighted by a green box).\n(A) door\n(B) tile" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896133_147066722700875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the candle (highlighted by a red box)? lamp (highlighted by a blue box) or lamp (highlighted by a green box).\n(A) lamp\n(B) lamp" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358647_2969830627750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, bar stool (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) bar stool\n(B) appliance" }, { "from": "gpt", "value": "(A) bar stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898340_508444505095416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, mechanical fan (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) mechanical fan\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649393_11285703317583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to furniture (highlighted by a red box), wall clock (highlighted by a blue box) or table (highlighted by a green box)?\n(A) wall clock\n(B) table" }, { "from": "gpt", "value": "(A) wall clock" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331084_133857978875416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, furniture (highlighted by a red box) or laptop (highlighted by a blue box)?\n(A) furniture\n(B) laptop" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899559_199458703007791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, lamp (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) lamp\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204724_23540529786583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, curtain (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) curtain\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018267_793719782687208_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the pillow (highlighted by a red box)? bed (highlighted by a blue box) or window (highlighted by a green box).\n(A) bed\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204319_15937958253958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to shelf (highlighted by a red box)? Select from bottle (highlighted by a blue box) and cupboard (highlighted by a green box).\n(A) bottle\n(B) cupboard" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669854_12647449164208_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897480_470946233224041_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898530_181126762740458_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to door (highlighted by a red box), picture frame (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896126_147316518747666_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is shelf (annotated by the red box) located relative to bulletin board? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895482_134791425835416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, book (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) book\n(B) toy" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897713_111832402936500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, appliance (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333581_207624021612833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of vegetation (annotated by the red box) in relation to curtain? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333144_40488721097291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from chair (highlighted by a red box)? desk (highlighted by a blue box) or television (highlighted by a green box)?\n(A) desk\n(B) television" }, { "from": "gpt", "value": "(B) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115628_3421094320416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, appliance (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430310_264992251380625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from floral arrangement (highlighted by a red box)? table (highlighted by a blue box) or journal (highlighted by a green box)?\n(A) table\n(B) journal" }, { "from": "gpt", "value": "(B) journal" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429758_356954659198500_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445716_63653512331875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to door (highlighted by a red box)? Select from door (highlighted by a blue box) and curtain (highlighted by a green box).\n(A) door\n(B) curtain" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331617_18263376842000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, cupboard (highlighted by a red box) or glass door (highlighted by a blue box)?\n(A) cupboard\n(B) glass door" }, { "from": "gpt", "value": "(B) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115199_94498746694666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, electric outlet (highlighted by a red box) or headboard (highlighted by a blue box)?\n(A) electric outlet\n(B) headboard" }, { "from": "gpt", "value": "(B) headboard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261406_29838804522833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, electric outlet (highlighted by a red box) or headboard (highlighted by a blue box)?\n(A) electric outlet\n(B) headboard" }, { "from": "gpt", "value": "(A) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899198_186624383700375_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from studio couch (highlighted by a red box)? Choose among these: coffee table (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) coffee table\n(B) pillow" }, { "from": "gpt", "value": "(A) coffee table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896251_8017931436875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, toilet (highlighted by a red box) or bathtub (highlighted by a blue box)?\n(A) toilet\n(B) bathtub" }, { "from": "gpt", "value": "(A) toilet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115352_4059002388500_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from christmas decoration (highlighted by a red box)? Select from television (highlighted by a blue box) and fireplace (highlighted by a green box).\n(A) television\n(B) fireplace" }, { "from": "gpt", "value": "(A) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261455_35819447190166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, television (highlighted by a red box) or equipment (highlighted by a blue box)?\n(A) television\n(B) equipment" }, { "from": "gpt", "value": "(A) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895574_1153859235153166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is gas stove (annotated by the red box) located in relation to paper towel in the image? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332609_363453012423625_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to screen door (highlighted by a red box)? Select from picture frame (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445132_5411842372708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, cloth (highlighted by a red box) or chest of drawers (highlighted by a blue box)?\n(A) cloth\n(B) chest of drawers" }, { "from": "gpt", "value": "(A) cloth" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115412_4194748648375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from table (highlighted by a red box)? Select from basket (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) basket\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669881_10908897013333_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the cabinetry (highlighted by a red box)? Choose among these: furniture (highlighted by a blue box) or home appliance (highlighted by a green box).\n(A) furniture\n(B) home appliance" }, { "from": "gpt", "value": "(B) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828441_91577034904041_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333110_108802394790458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, screen door (highlighted by a red box) or glass vase (highlighted by a blue box)?\n(A) screen door\n(B) glass vase" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429728_19169042443333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from book (highlighted by a red box)? Choose among these: book (highlighted by a blue box) or book (highlighted by a green box).\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261096_1316443555666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, chair (highlighted by a red box) or bowl (highlighted by a blue box)?\n(A) chair\n(B) bowl" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331700_9652230303958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, electric outlet (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) electric outlet\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899491_197814354604125_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the cabinetry (highlighted by a red box)? Choose among these: cabinetry (highlighted by a blue box) or window (highlighted by a green box).\n(A) cabinetry\n(B) window" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895249_75906186030583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, picture frame (highlighted by a red box) or ceramic tile (highlighted by a blue box)?\n(A) picture frame\n(B) ceramic tile" }, { "from": "gpt", "value": "(B) ceramic tile" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204730_23400621082625_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from chair (highlighted by a red box)? entertainment center (highlighted by a blue box) or footrest (highlighted by a green box)?\n(A) entertainment center\n(B) footrest" }, { "from": "gpt", "value": "(B) footrest" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663398_95022301333625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from bottle (highlighted by a red box)? chair (highlighted by a blue box) or houseplant (highlighted by a green box)?\n(A) chair\n(B) houseplant" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204390_23048889639541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from cabinetry (highlighted by a red box)? fireplace (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) fireplace\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332074_249877983408333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, furniture (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) furniture\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898988_823955704327041_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334202_103302992331416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, flannel (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) flannel\n(B) houseplant" }, { "from": "gpt", "value": "(A) flannel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896379_20419944019125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, picture frame (highlighted by a red box) or chest of drawers (highlighted by a blue box)?\n(A) picture frame\n(B) chest of drawers" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895469_132748018627541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, picture frame (highlighted by a red box) or television (highlighted by a blue box)?\n(A) picture frame\n(B) television" }, { "from": "gpt", "value": "(B) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445848_69403462661916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, footwear (highlighted by a red box) or footwear (highlighted by a blue box)?\n(A) footwear\n(B) footwear" }, { "from": "gpt", "value": "(A) footwear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334966_669413082233625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, window screen (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) window screen\n(B) radiator" }, { "from": "gpt", "value": "(A) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895286_80185542917291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, bed (highlighted by a red box) or nightstand (highlighted by a blue box)?\n(A) bed\n(B) nightstand" }, { "from": "gpt", "value": "(B) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897947_533461625364291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, sink (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) sink\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331240_284323924614541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from pillow (highlighted by a red box)? Choose from nightstand (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) nightstand\n(B) pillow" }, { "from": "gpt", "value": "(A) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739729_3100775932166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, refrigerator (highlighted by a red box) or microwave oven (highlighted by a blue box)?\n(A) refrigerator\n(B) microwave oven" }, { "from": "gpt", "value": "(A) refrigerator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669927_14262967761708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, washing machine (highlighted by a red box) or plant (highlighted by a blue box)?\n(A) washing machine\n(B) plant" }, { "from": "gpt", "value": "(A) washing machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018276_794870779573083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, electric outlet (highlighted by a red box) or hardwood (highlighted by a blue box)?\n(A) electric outlet\n(B) hardwood" }, { "from": "gpt", "value": "(B) hardwood" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796744_28952068847333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, coffee table (highlighted by a red box) or bedding (highlighted by a blue box)?\n(A) coffee table\n(B) bedding" }, { "from": "gpt", "value": "(A) coffee table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896469_21828086699875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, picture frame (highlighted by a red box) or shower door (highlighted by a blue box)?\n(A) picture frame\n(B) shower door" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444750_79678468582208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of lighting (annotated by the red box) in reference to door?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204585_614222969833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to door (highlighted by a red box)? Choose from door (highlighted by a blue box) and door (highlighted by a green box).\n(A) door\n(B) door" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649417_10157597841916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, book (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) book\n(B) houseplant" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334935_663088899377500_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to lamp (highlighted by a red box)? plant (highlighted by a blue box) or curtain (highlighted by a green box).\n(A) plant\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204305_15145271434750_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, bottle (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260938_4936192303000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from chair (highlighted by a red box)? Select from curtain (highlighted by a blue box) and dresser (highlighted by a green box).\n(A) curtain\n(B) dresser" }, { "from": "gpt", "value": "(B) dresser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458221_76898959859625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of laundry basket (annotated by the red box) in reference to mat?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018334_116256999035708_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the cardboard box (highlighted by a red box)? cardboard box (highlighted by a blue box) or lighting (highlighted by a green box).\n(A) cardboard box\n(B) lighting" }, { "from": "gpt", "value": "(A) cardboard box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204505_838757707750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, television (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) television\n(B) cabinetry" }, { "from": "gpt", "value": "(A) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430392_125984266466125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828552_101594709492125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, bar stool (highlighted by a red box) or bath towel (highlighted by a blue box)?\n(A) bar stool\n(B) bath towel" }, { "from": "gpt", "value": "(A) bar stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458717_137690891346666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to shower door (highlighted by a red box), tile (highlighted by a blue box) or tap (highlighted by a green box)?\n(A) tile\n(B) tap" }, { "from": "gpt", "value": "(A) tile" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204680_13274673173458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, bathroom cabinet (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) bathroom cabinet\n(B) screen door" }, { "from": "gpt", "value": "(A) bathroom cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358362_16164155798666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, toy (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445583_283663365888666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from desk (highlighted by a red box)? Choose from bed (highlighted by a blue box) and chair (highlighted by a green box).\n(A) bed\n(B) chair" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261317_23547481855833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, chair (highlighted by a red box) or chest of drawers (highlighted by a blue box)?\n(A) chair\n(B) chest of drawers" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333275_24808502075750_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from picture frame (highlighted by a red box)? window (highlighted by a blue box) or window (highlighted by a green box)?\n(A) window\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204390_23016786300750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, television (highlighted by a red box) or shopping bag (highlighted by a blue box)?\n(A) television\n(B) shopping bag" }, { "from": "gpt", "value": "(B) shopping bag" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649478_14907540219708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to table lamp (highlighted by a red box), book (highlighted by a blue box) or book (highlighted by a green box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446025_134721311270583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the toy (highlighted by a red box)? Choose among these: table (highlighted by a blue box) or chair (highlighted by a green box).\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670224_53961172350958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhere is flower (annotated by the red box) located in relation to window in the image?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332197_263690737114375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, toilet paper (highlighted by a red box) or bath mat (highlighted by a blue box)?\n(A) toilet paper\n(B) bath mat" }, { "from": "gpt", "value": "(A) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332764_43964127466916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, throw pillow (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) throw pillow\n(B) studio couch" }, { "from": "gpt", "value": "(A) throw pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796692_30714245619500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, light switch (highlighted by a red box) or door (highlighted by a blue box)?\n(A) light switch\n(B) door" }, { "from": "gpt", "value": "(A) light switch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333045_59515562460666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, air conditioning (highlighted by a red box) or computer monitor (highlighted by a blue box)?\n(A) air conditioning\n(B) computer monitor" }, { "from": "gpt", "value": "(A) air conditioning" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430598_315311627268833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of fireplace (annotated by the red box) and mat in the image provided, where is fireplace (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828390_94716597024708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the pillow (highlighted by a red box)? nightstand (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) nightstand\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828320_76249737274166_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from cabinetry (highlighted by a red box)? Select from exhaust hood (highlighted by a blue box) and appliance (highlighted by a green box).\n(A) exhaust hood\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115394_3346863964583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, picture frame (highlighted by a red box) or plant (highlighted by a blue box)?\n(A) picture frame\n(B) plant" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333847_74996233794708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, toy (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018462_527487779128916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from houseplant (highlighted by a red box)? houseplant (highlighted by a blue box) or houseplant (highlighted by a green box)?\n(A) houseplant\n(B) houseplant" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895179_37913665855833_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the paperback book (highlighted by a red box)? picture frame (highlighted by a blue box) or book (highlighted by a green box).\n(A) picture frame\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358386_19226751070750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, table (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) table\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333803_51572838853625_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to curtain (highlighted by a red box)? Choose from houseplant (highlighted by a blue box) and window (highlighted by a green box).\n(A) houseplant\n(B) window" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670028_32342506991708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, fridge (highlighted by a red box) or table (highlighted by a blue box)?\n(A) fridge\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670234_52926975403333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from mirror (highlighted by a red box)? towel (highlighted by a blue box) or towel bar (highlighted by a green box)?\n(A) towel\n(B) towel bar" }, { "from": "gpt", "value": "(B) towel bar" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430608_315207619999416_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from houseplant (highlighted by a red box), animal (highlighted by a blue box) or houseplant (highlighted by a green box)?\n(A) animal\n(B) houseplant" }, { "from": "gpt", "value": "(A) animal" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334058_86130489075541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from light switch (highlighted by a red box)? Choose among these: shelf (highlighted by a blue box) or shelf (highlighted by a green box).\n(A) shelf\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649393_11275707475000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, clock (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) clock\n(B) chair" }, { "from": "gpt", "value": "(A) clock" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899112_128900170150708_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, extinguisher (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) extinguisher\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895572_1153804840414125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, plant (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) plant\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828493_101848298849041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, window frame (highlighted by a red box) or mixing bowl (highlighted by a blue box)?\n(A) window frame\n(B) mixing bowl" }, { "from": "gpt", "value": "(B) mixing bowl" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899573_959548533264666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the kitchen appliance (highlighted by a red box)? home appliance (highlighted by a blue box) or kitchen appliance (highlighted by a green box).\n(A) home appliance\n(B) kitchen appliance" }, { "from": "gpt", "value": "(B) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445583_283675360936416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of furniture (annotated by the red box) in relation to garbage?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334966_669390774607875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, table lamp (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) table lamp\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018825_647317371762250_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the chair (highlighted by a red box)? houseplant (highlighted by a blue box) or window screen (highlighted by a green box).\n(A) houseplant\n(B) window screen" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663415_95898871826125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the window sill (highlighted by a red box)? window (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) window\n(B) pillow" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429816_744567901325958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, nightstand (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) nightstand\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899598_202528227363416_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to bed (highlighted by a red box), bedside lamp (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) bedside lamp\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669880_11182305415083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the cabinetry (highlighted by a red box)? Choose among these: faucet (highlighted by a blue box) or home appliance (highlighted by a green box).\n(A) faucet\n(B) home appliance" }, { "from": "gpt", "value": "(B) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897798_131238113192958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from cabinetry (highlighted by a red box)? bottle (highlighted by a blue box) or sink (highlighted by a green box)?\n(A) bottle\n(B) sink" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331617_18214979868583_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, glass vase (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) glass vase\n(B) pillow" }, { "from": "gpt", "value": "(A) glass vase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358328_19155069149875_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331910_627541870315208_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the door (highlighted by a red box)? Choose among these: bed (highlighted by a blue box) or door (highlighted by a green box).\n(A) bed\n(B) door" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331080_133649879583833_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the screen door (highlighted by a red box)? Choose among these: screen door (highlighted by a blue box) or towel (highlighted by a green box).\n(A) screen door\n(B) towel" }, { "from": "gpt", "value": "(B) towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828311_76532542097666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, television (highlighted by a red box) or table (highlighted by a blue box)?\n(A) television\n(B) table" }, { "from": "gpt", "value": "(A) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333277_24329815141125_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444751_79741875800916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, appliance (highlighted by a red box) or window (highlighted by a blue box)?\n(A) appliance\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896354_18679105215125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, couch (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) couch\n(B) studio couch" }, { "from": "gpt", "value": "(A) couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444706_73270573655250_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from chest of drawers (highlighted by a red box)? light switch (highlighted by a blue box) or light switch (highlighted by a green box)?\n(A) light switch\n(B) light switch" }, { "from": "gpt", "value": "(B) light switch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899340_714866946403708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, furniture (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) furniture\n(B) screen door" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333281_25554132956458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, picture frame (highlighted by a red box) or bed (highlighted by a blue box)?\n(A) picture frame\n(B) bed" }, { "from": "gpt", "value": "(B) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333277_24427808363250_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the picture frame (highlighted by a red box)? Choose among these: houseplant (highlighted by a blue box) or houseplant (highlighted by a green box).\n(A) houseplant\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895507_452180923782625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, door (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) door\n(B) screen door" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260938_5106191629541_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, shelf (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) shelf\n(B) window sill" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115216_95061233563625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, studio couch (highlighted by a red box) or window (highlighted by a blue box)?\n(A) studio couch\n(B) window" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334615_385665630524500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, studio couch (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48017828_696944674861000_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from tile (highlighted by a red box)? Select from mat (highlighted by a blue box) and mat (highlighted by a green box).\n(A) mat\n(B) mat" }, { "from": "gpt", "value": "(A) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204387_23162475758541_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358345_15154818681208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, dresser (highlighted by a red box) or window (highlighted by a blue box)?\n(A) dresser\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895465_130616002385250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, coffee cup (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) coffee cup\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430814_65781688351708_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, appliance (highlighted by a red box) or frying pan (highlighted by a blue box)?\n(A) appliance\n(B) frying pan" }, { "from": "gpt", "value": "(B) frying pan" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445639_58352774815666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899955_865610862726333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is dresser (annotated by the red box) located relative to curtain?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444859_96524852976583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to box (highlighted by a red box)? plastic bag (highlighted by a blue box) or doormat (highlighted by a green box).\n(A) plastic bag\n(B) doormat" }, { "from": "gpt", "value": "(B) doormat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649409_10216691132583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from houseplant (highlighted by a red box), curtain (highlighted by a blue box) or book (highlighted by a green box)?\n(A) curtain\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333033_58876031140125_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from chest of drawers (highlighted by a red box), chest of drawers (highlighted by a blue box) or book (highlighted by a green box)?\n(A) chest of drawers\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261317_23539485173416_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from pillow (highlighted by a red box)? book (highlighted by a blue box) or book (highlighted by a green box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332287_385402004300958_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to chair (highlighted by a red box)? Choose from chair (highlighted by a blue box) and table (highlighted by a green box).\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649714_47880656593000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, droplight (highlighted by a red box) or window frame (highlighted by a blue box)?\n(A) droplight\n(B) window frame" }, { "from": "gpt", "value": "(A) droplight" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739276_42897464555083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from desk (highlighted by a red box)? stool (highlighted by a blue box) or curtain (highlighted by a green box)?\n(A) stool\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331915_629349186549458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, book (highlighted by a red box) or speaker (highlighted by a blue box)?\n(A) book\n(B) speaker" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899318_887493705348250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, table (highlighted by a red box) or floral arrangement (highlighted by a blue box)?\n(A) table\n(B) floral arrangement" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899935_863074774296791_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331294_14775743852083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from radiator (highlighted by a red box), bed (highlighted by a blue box) or stuff (highlighted by a green box)?\n(A) bed\n(B) stuff" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897815_132662496303666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from window (highlighted by a red box)? furniture (highlighted by a blue box) or balustrade (highlighted by a green box)?\n(A) furniture\n(B) balustrade" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115265_115167268360625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649603_36113594734916_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from bedside lamp (highlighted by a red box)? Choose among these: pillow (highlighted by a blue box) or coffee table (highlighted by a green box).\n(A) pillow\n(B) coffee table" }, { "from": "gpt", "value": "(B) coffee table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358168_61058041288583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, desk (highlighted by a red box) or door (highlighted by a blue box)?\n(A) desk\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895245_75688991775666_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, book (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) book\n(B) pillow" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358173_62543045429625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, furniture (highlighted by a red box) or tile (highlighted by a blue box)?\n(A) furniture\n(B) tile" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358176_62243630758625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, furniture (highlighted by a red box) or bath mat (highlighted by a blue box)?\n(A) furniture\n(B) bath mat" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018098_367343310317291_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to writing (highlighted by a red box)? drawer (highlighted by a blue box) or mirror (highlighted by a green box).\n(A) drawer\n(B) mirror" }, { "from": "gpt", "value": "(A) drawer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204316_15865055111958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to curtain (highlighted by a red box), furniture (highlighted by a blue box) or radiator (highlighted by a green box)?\n(A) furniture\n(B) radiator" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358252_6113645164041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, christmas tree (highlighted by a red box) or table (highlighted by a blue box)?\n(A) christmas tree\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670334_66336192609833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, picture frame (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) picture frame\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445997_133905461484291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, countertop (highlighted by a red box) or faucet (highlighted by a blue box)?\n(A) countertop\n(B) faucet" }, { "from": "gpt", "value": "(A) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334756_421270503276166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from cabinetry (highlighted by a red box)? Choose among these: electric outlet (highlighted by a blue box) or window (highlighted by a green box).\n(A) electric outlet\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445745_65666532232875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, mirror (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) mirror\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828272_84528784726791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of home appliance (annotated by the red box) in reference to furniture?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899899_1026859429520250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, bed (highlighted by a red box) or bay window (highlighted by a blue box)?\n(A) bed\n(B) bay window" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332184_262653617937166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, square (highlighted by a red box) or postcard (highlighted by a blue box)?\n(A) square\n(B) postcard" }, { "from": "gpt", "value": "(B) postcard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898903_817228029514625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, material (highlighted by a red box) or sink (highlighted by a blue box)?\n(A) material\n(B) sink" }, { "from": "gpt", "value": "(A) material" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334853_615535438842416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, door (highlighted by a red box) or glass door (highlighted by a blue box)?\n(A) door\n(B) glass door" }, { "from": "gpt", "value": "(B) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261331_24080929054041_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the bathtub (highlighted by a red box)? toilet (highlighted by a blue box) or basket (highlighted by a green box).\n(A) toilet\n(B) basket" }, { "from": "gpt", "value": "(B) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204296_14327601456458_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from curtain (highlighted by a red box)? bulletin board (highlighted by a blue box) or door (highlighted by a green box)?\n(A) bulletin board\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334912_1090005077882125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, cabinetry (highlighted by a red box) or kitchen appliance (highlighted by a blue box)?\n(A) cabinetry\n(B) kitchen appliance" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663007_32268109466666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from plain (highlighted by a red box)? Choose among these: chair (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) chair\n(B) pillow" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018012_458829274357333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, chair (highlighted by a red box) or notepad (highlighted by a blue box)?\n(A) chair\n(B) notepad" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739459_51773593372791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from window (highlighted by a red box), tripod (highlighted by a blue box) or curtain (highlighted by a green box)?\n(A) tripod\n(B) curtain" }, { "from": "gpt", "value": "(A) tripod" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334202_103338194798000_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the refrigerator (highlighted by a red box)? window (highlighted by a blue box) or curtain (highlighted by a green box).\n(A) window\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796475_4222925139250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, furniture (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) furniture\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669959_27826893551833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the sink (highlighted by a red box)? Choose among these: window sill (highlighted by a blue box) or coffee machine (highlighted by a green box).\n(A) window sill\n(B) coffee machine" }, { "from": "gpt", "value": "(A) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444781_50230805261416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, curtain (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) curtain\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669881_10934903395541_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from sink (highlighted by a red box)? Choose among these: cabinetry (highlighted by a blue box) or door (highlighted by a green box).\n(A) cabinetry\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663322_77605666807583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, coffee table (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) coffee table\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331174_276468901891000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, laundry (highlighted by a red box) or cabinet (highlighted by a blue box)?\n(A) laundry\n(B) cabinet" }, { "from": "gpt", "value": "(B) cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333562_200678381241791_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from towel (highlighted by a red box)? towel (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) towel\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739914_15575694649708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, window sill (highlighted by a red box) or window (highlighted by a blue box)?\n(A) window sill\n(B) window" }, { "from": "gpt", "value": "(A) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332321_390760968189666_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from vegetation (highlighted by a red box)? Choose among these: cabinet (highlighted by a blue box) or curtain (highlighted by a green box).\n(A) cabinet\n(B) curtain" }, { "from": "gpt", "value": "(A) cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018580_5571689392833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, studio couch (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018227_469035313903375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, table (highlighted by a red box) or floral arrangement (highlighted by a blue box)?\n(A) table\n(B) floral arrangement" }, { "from": "gpt", "value": "(B) floral arrangement" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115519_13204268714958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to toiletry (highlighted by a red box)? Select from sink (highlighted by a blue box) and door (highlighted by a green box).\n(A) sink\n(B) door" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333475_58610242777041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhere is furniture (annotated by the red box) located in relation to bean bag chair in the image?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204795_24291833544416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, kitchen appliance (highlighted by a red box) or gas stove (highlighted by a blue box)?\n(A) kitchen appliance\n(B) gas stove" }, { "from": "gpt", "value": "(B) gas stove" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358162_60948734512041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from curtain (highlighted by a red box), lamp (highlighted by a blue box) or screen door (highlighted by a green box)?\n(A) lamp\n(B) screen door" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796475_4200934254957_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, sheet (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) sheet\n(B) pillow" }, { "from": "gpt", "value": "(A) sheet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261725_2762400622208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, kitchen & dining room table (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) kitchen & dining room table\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48017894_80908156981166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, houseplant (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) houseplant\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332795_47484000044500_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from storage box (highlighted by a red box)? Choose among these: shelf (highlighted by a blue box) or toy (highlighted by a green box).\n(A) shelf\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445697_62735101504916_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to book (highlighted by a red box)? Choose from book (highlighted by a blue box) and lamp (highlighted by a green box).\n(A) book\n(B) lamp" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334482_103396724222916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, medicine cabinet (highlighted by a red box) or bath mat (highlighted by a blue box)?\n(A) medicine cabinet\n(B) bath mat" }, { "from": "gpt", "value": "(A) medicine cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018785_18256441137333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, bed (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) bed\n(B) bottle" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331276_12744854227916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, houseplant (highlighted by a red box) or stool (highlighted by a blue box)?\n(A) houseplant\n(B) stool" }, { "from": "gpt", "value": "(B) stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115304_119499025698166_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to lamp (highlighted by a red box)? Select from curtain (highlighted by a blue box) and bay window (highlighted by a green box).\n(A) curtain\n(B) bay window" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446588_206039137132041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to curtain (highlighted by a red box), houseplant (highlighted by a blue box) or leaf (highlighted by a green box)?\n(A) houseplant\n(B) leaf" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899936_863349977174125_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895859_489152755897541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the toy (highlighted by a red box)? radiator (highlighted by a blue box) or bed (highlighted by a green box).\n(A) radiator\n(B) bed" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796230_2580612678083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from desk (highlighted by a red box)? swivel chair (highlighted by a blue box) or radiator (highlighted by a green box)?\n(A) swivel chair\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260938_4900189888750_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from chair (highlighted by a red box)? Select from curtain (highlighted by a blue box) and table lamp (highlighted by a green box).\n(A) curtain\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429729_18993247384125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, curtain (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) curtain\n(B) radiator" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333104_108754081071500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to glass bowl (highlighted by a red box)? Select from chair (highlighted by a blue box) and tablecloth (highlighted by a green box).\n(A) chair\n(B) tablecloth" }, { "from": "gpt", "value": "(B) tablecloth" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828554_101453015545541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to curtain (highlighted by a red box), cardboard box (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) cardboard box\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446497_357486933504583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, shower door (highlighted by a red box) or shower curtain (highlighted by a blue box)?\n(A) shower door\n(B) shower curtain" }, { "from": "gpt", "value": "(B) shower curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458519_113893548248125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of door (annotated by the red box) in relation to robe? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430858_74487492394541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from screen door (highlighted by a red box)? Choose among these: mat (highlighted by a blue box) or mirror (highlighted by a green box).\n(A) mat\n(B) mirror" }, { "from": "gpt", "value": "(B) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018155_373338272768333_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670350_67502582196749_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of picture frame (annotated by the red box) in reference to table?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444501_2424811550958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, pillow (highlighted by a red box) or table (highlighted by a blue box)?\n(A) pillow\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445471_150989524809166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, window (highlighted by a red box) or counter top (highlighted by a blue box)?\n(A) window\n(B) counter top" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260938_4794198488708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, picture frame (highlighted by a red box) or table (highlighted by a blue box)?\n(A) picture frame\n(B) table" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261228_13798715892958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to picture frame (highlighted by a red box)? flower (highlighted by a blue box) or chest of drawers (highlighted by a green box).\n(A) flower\n(B) chest of drawers" }, { "from": "gpt", "value": "(B) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898256_696466039751541_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, furniture (highlighted by a red box) or bowl (highlighted by a blue box)?\n(A) furniture\n(B) bowl" }, { "from": "gpt", "value": "(B) bowl" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458451_118208526057875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, chair (highlighted by a red box) or kitchen & dining room table (highlighted by a blue box)?\n(A) chair\n(B) kitchen & dining room table" }, { "from": "gpt", "value": "(B) kitchen & dining room table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828504_102350069505583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, chair (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) chair\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899112_128870182212833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, countertop (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) countertop\n(B) bottle" }, { "from": "gpt", "value": "(A) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430808_64042304375583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, door (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) door\n(B) mat" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331091_134626711461166_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from storage box (highlighted by a red box), shelf (highlighted by a blue box) or storage box (highlighted by a green box)?\n(A) shelf\n(B) storage box" }, { "from": "gpt", "value": "(B) storage box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261317_23581484409958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from chair (highlighted by a red box)? Choose from concrete (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) concrete\n(B) pillow" }, { "from": "gpt", "value": "(A) concrete" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898651_572805818758375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to window screen (highlighted by a red box), table (highlighted by a blue box) or television (highlighted by a green box)?\n(A) table\n(B) television" }, { "from": "gpt", "value": "(B) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670038_32932029503541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to bottle (highlighted by a red box)? Select from bottle (highlighted by a blue box) and book (highlighted by a green box).\n(A) bottle\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446444_82615008002208_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018699_544750342977083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, chair (highlighted by a red box) or table (highlighted by a blue box)?\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333319_28605338375583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, lamp (highlighted by a red box) or vase (highlighted by a blue box)?\n(A) lamp\n(B) vase" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444703_73411766102791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, table lamp (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) table lamp\n(B) pillow" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260938_4886195427875_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from chair (highlighted by a red box), curtain (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) curtain\n(B) chair" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331587_15971987228625_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from nightstand (highlighted by a red box)? Select from bed (highlighted by a blue box) and book (highlighted by a green box).\n(A) bed\n(B) book" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47431138_351209681034208_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the door (highlighted by a red box)? stair (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) stair\n(B) cabinetry" }, { "from": "gpt", "value": "(A) stair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895446_129402894102333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, counter top (highlighted by a red box) or glass vase (highlighted by a blue box)?\n(A) counter top\n(B) glass vase" }, { "from": "gpt", "value": "(A) counter top" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739919_16201972892500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to side table (highlighted by a red box)? Select from window (highlighted by a blue box) and radiator (highlighted by a green box).\n(A) window\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331177_277410198637208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, toy (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898203_145878379506875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, floral arrangement (highlighted by a red box) or desk (highlighted by a blue box)?\n(A) floral arrangement\n(B) desk" }, { "from": "gpt", "value": "(B) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447308_409776167375666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, window frame (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) window frame\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899031_643171024793166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, coffee cup (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) coffee cup\n(B) toy" }, { "from": "gpt", "value": "(A) coffee cup" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333512_48561494066458_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from electric outlet (highlighted by a red box)? Select from window (highlighted by a blue box) and window sill (highlighted by a green box).\n(A) window\n(B) window sill" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334754_421205712835125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, window sill (highlighted by a red box) or wide (highlighted by a blue box)?\n(A) window sill\n(B) wide" }, { "from": "gpt", "value": "(A) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430683_326412178963791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhere is chair (annotated by the red box) located in relation to table in the image?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334837_613727254695541_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the bed (highlighted by a red box)? doormat (highlighted by a blue box) or cupboard (highlighted by a green box).\n(A) doormat\n(B) cupboard" }, { "from": "gpt", "value": "(A) doormat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663250_75034082397000_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331173_276409692522833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, bookshelf (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) bookshelf\n(B) chair" }, { "from": "gpt", "value": "(A) bookshelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458221_76870971467250_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to garbage (highlighted by a red box)? Select from desk (highlighted by a blue box) and chair (highlighted by a green box).\n(A) desk\n(B) chair" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430822_67731770787874_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444735_77877097386500_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, screen door (highlighted by a red box) or christmas tree (highlighted by a blue box)?\n(A) screen door\n(B) christmas tree" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670197_53472210977916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, guitar (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) guitar\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331294_14701241027083_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458231_78585995369875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, bowl (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) bowl\n(B) houseplant" }, { "from": "gpt", "value": "(A) bowl" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896122_145800122651541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, furniture (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) furniture\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430068_34719380618290_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670133_40029871972250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is door (annotated by the red box) located relative to exhaust hood? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429826_746698897539833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to toiletry (highlighted by a red box)? toiletry (highlighted by a blue box) or toiletry (highlighted by a green box).\n(A) toiletry\n(B) toiletry" }, { "from": "gpt", "value": "(A) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331921_630963893843291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is book (annotated by the red box) located in relation to book in the image? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018304_109020489147458_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to shelf (highlighted by a red box)? Select from bottle (highlighted by a blue box) and bottle (highlighted by a green box).\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334227_106994306897416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from accessory (highlighted by a red box)? Choose from cabinet (highlighted by a blue box) and shelf (highlighted by a green box).\n(A) cabinet\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331946_165358521205041_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears farthest from the camera in this image?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47431120_348924031379500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, appliance (highlighted by a red box) or countertop (highlighted by a blue box)?\n(A) appliance\n(B) countertop" }, { "from": "gpt", "value": "(B) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358295_15817058182958_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333561_200733775552875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from cleaning product (highlighted by a red box)? Choose among these: toothpaste (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) toothpaste\n(B) cabinetry" }, { "from": "gpt", "value": "(A) toothpaste" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447226_212418412493000_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the washing machine (highlighted by a red box)? Choose among these: dish washer (highlighted by a blue box) or laundry (highlighted by a green box).\n(A) dish washer\n(B) laundry" }, { "from": "gpt", "value": "(B) laundry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669936_14795892478916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to door (highlighted by a red box)? Choose from door (highlighted by a blue box) and shelf (highlighted by a green box).\n(A) door\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670315_64435332206458_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from lamp (highlighted by a red box)? Select from candle holder (highlighted by a blue box) and armchair (highlighted by a green box).\n(A) candle holder\n(B) armchair" }, { "from": "gpt", "value": "(B) armchair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670350_67504581406957_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, table lamp (highlighted by a red box) or table (highlighted by a blue box)?\n(A) table lamp\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332201_264274279744457_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from tile (highlighted by a red box), kitchen appliance (highlighted by a blue box) or countertop (highlighted by a green box)?\n(A) kitchen appliance\n(B) countertop" }, { "from": "gpt", "value": "(A) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898247_167674830092458_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to picture frame (highlighted by a red box), table (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) table\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662891_19509493012791_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears farthest from the camera in this image?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333061_60747864758791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, toiletry (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) toiletry\n(B) toiletry" }, { "from": "gpt", "value": "(A) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663064_38456495992833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, electric outlet (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) electric outlet\n(B) cabinetry" }, { "from": "gpt", "value": "(A) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334672_391426114070000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, furniture (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) furniture\n(B) appliance" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446450_354549021329708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, screen door (highlighted by a red box) or balustrade (highlighted by a blue box)?\n(A) screen door\n(B) balustrade" }, { "from": "gpt", "value": "(B) balustrade" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333275_24800505364666_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, laptop (highlighted by a red box) or coffee table (highlighted by a blue box)?\n(A) laptop\n(B) coffee table" }, { "from": "gpt", "value": "(A) laptop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896199_142403147133125_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796279_850668839416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, window screen (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) window screen\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458706_136826459207000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is electric outlet (annotated by the red box) located relative to cabinetry? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898350_511470781439250_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to chair (highlighted by a red box)? Select from chair (highlighted by a blue box) and table (highlighted by a green box).\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899663_234340471399666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, cabinetry (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) cabinetry\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358645_3286233010416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, lamp (highlighted by a red box) or elevator (highlighted by a blue box)?\n(A) lamp\n(B) elevator" }, { "from": "gpt", "value": "(B) elevator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446050_79834858376875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, mirror (highlighted by a red box) or glass door (highlighted by a blue box)?\n(A) mirror\n(B) glass door" }, { "from": "gpt", "value": "(B) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662962_24718484784916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, faucet (highlighted by a red box) or plywood (highlighted by a blue box)?\n(A) faucet\n(B) plywood" }, { "from": "gpt", "value": "(B) plywood" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358693_3164727516416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, armoire (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) armoire\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445125_5216024645625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, door (highlighted by a red box) or table (highlighted by a blue box)?\n(A) door\n(B) table" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670293_62014916898541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, faucet (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) faucet\n(B) cabinetry" }, { "from": "gpt", "value": "(A) faucet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670133_40019775963958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to radiator (highlighted by a red box)? Choose from chest of drawers (highlighted by a blue box) and chest of drawers (highlighted by a green box).\n(A) chest of drawers\n(B) chest of drawers" }, { "from": "gpt", "value": "(B) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358700_5240660033041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331343_192435418862333_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429846_11712463894791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, picture frame (highlighted by a red box) or door (highlighted by a blue box)?\n(A) picture frame\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670288_62151213011583_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, houseplant (highlighted by a red box) or dresser (highlighted by a blue box)?\n(A) houseplant\n(B) dresser" }, { "from": "gpt", "value": "(B) dresser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332207_264511783409875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from shelf (highlighted by a red box)? Select from chair (highlighted by a blue box) and studio couch (highlighted by a green box).\n(A) chair\n(B) studio couch" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447287_408776600915833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, kitchen appliance (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) kitchen appliance\n(B) appliance" }, { "from": "gpt", "value": "(A) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896429_19294548099083_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018750_7061265604541_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, cabinetry (highlighted by a red box) or bar stool (highlighted by a blue box)?\n(A) cabinetry\n(B) bar stool" }, { "from": "gpt", "value": "(B) bar stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896310_6763731044750_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the shelf (highlighted by a red box)? book (highlighted by a blue box) or table (highlighted by a green box).\n(A) book\n(B) table" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649408_10080395042875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to book (highlighted by a red box)? table (highlighted by a blue box) or book (highlighted by a green box).\n(A) table\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649742_49616988542791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018746_7254753670375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from armchair (highlighted by a red box)? armchair (highlighted by a blue box) or furniture (highlighted by a green box)?\n(A) armchair\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331158_181714612300958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, furniture (highlighted by a red box) or stairwell (highlighted by a blue box)?\n(A) furniture\n(B) stairwell" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332026_202803500533916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, cabinetry (highlighted by a red box) or door (highlighted by a blue box)?\n(A) cabinetry\n(B) door" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331922_630801792414666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of computer monitor (annotated by the red box) in relation to shelf? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429771_360039019518166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to lamp (highlighted by a red box)? picture frame (highlighted by a blue box) or lamp (highlighted by a green box).\n(A) picture frame\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446561_86531474262458_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, door (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) door\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204589_551214537250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, picture frame (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) picture frame\n(B) screen door" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333110_108779887261708_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from book (highlighted by a red box)? chair (highlighted by a blue box) or book (highlighted by a green box)?\n(A) chair\n(B) book" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48017829_696884865871000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, appliance (highlighted by a red box) or table (highlighted by a blue box)?\n(A) appliance\n(B) table" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898340_508405004669875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, file cabinet (highlighted by a red box) or towel (highlighted by a blue box)?\n(A) file cabinet\n(B) towel" }, { "from": "gpt", "value": "(A) file cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897745_115957765646125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to toilet (highlighted by a red box)? soap dispenser (highlighted by a blue box) or sink (highlighted by a green box).\n(A) soap dispenser\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331507_155048409173041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, window (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) window\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261675_3125442402125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, chest of drawer (highlighted by a red box) or chest of drawers (highlighted by a blue box)?\n(A) chest of drawer\n(B) chest of drawers" }, { "from": "gpt", "value": "(B) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895614_470391492750291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chair (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) chair\n(B) bottle" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332183_262706613132625_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from glass door (highlighted by a red box)? furniture (highlighted by a blue box) or shelf (highlighted by a green box)?\n(A) furniture\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261269_13836501111750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, toiletry (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) toiletry\n(B) toiletry" }, { "from": "gpt", "value": "(B) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334728_535747027042833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, television (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) television\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898256_696442032896208_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669927_14284959071416_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to houseplant (highlighted by a red box)? Select from cabinetry (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) cabinetry\n(B) cabinetry" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897467_471469816285416_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to backpack (highlighted by a red box), chair (highlighted by a blue box) or box (highlighted by a green box)?\n(A) chair\n(B) box" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897512_472718499008666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to box (highlighted by a red box), box (highlighted by a blue box) or box (highlighted by a green box)?\n(A) box\n(B) box" }, { "from": "gpt", "value": "(B) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899270_883837296115541_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, mouthwash (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) mouthwash\n(B) toiletry" }, { "from": "gpt", "value": "(B) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334209_105614099961250_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444907_106168757590375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331522_190756283502083_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to oven (highlighted by a red box)? Select from wok (highlighted by a blue box) and countertop (highlighted by a green box).\n(A) wok\n(B) countertop" }, { "from": "gpt", "value": "(A) wok" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332158_260211038286708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, table (highlighted by a red box) or handle (highlighted by a blue box)?\n(A) table\n(B) handle" }, { "from": "gpt", "value": "(B) handle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897951_533512337866375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of bath towel (annotated by the red box) and screen door in the image provided, where is bath towel (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444696_72546774303125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to kitchen appliance (highlighted by a red box)? Choose from cabinetry (highlighted by a blue box) and toaster (highlighted by a green box).\n(A) cabinetry\n(B) toaster" }, { "from": "gpt", "value": "(B) toaster" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447210_209240768984958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, door handle (highlighted by a red box) or shower (highlighted by a blue box)?\n(A) door handle\n(B) shower" }, { "from": "gpt", "value": "(B) shower" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897523_472471001098958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to storage box (highlighted by a red box)? storage box (highlighted by a blue box) or shelf (highlighted by a green box).\n(A) storage box\n(B) shelf" }, { "from": "gpt", "value": "(A) storage box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896195_142288042718166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, door (highlighted by a red box) or mattress (highlighted by a blue box)?\n(A) door\n(B) mattress" }, { "from": "gpt", "value": "(B) mattress" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358278_8990921900083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, kitchen appliance (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) kitchen appliance\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018307_109052776128416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, houseplant (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) houseplant\n(B) chair" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898782_67466106026708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chair (highlighted by a red box) or fireplace (highlighted by a blue box)?\n(A) chair\n(B) fireplace" }, { "from": "gpt", "value": "(B) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896063_132118989728833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to picture frame (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445680_62000352339958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, basin (highlighted by a red box) or writing (highlighted by a blue box)?\n(A) basin\n(B) writing" }, { "from": "gpt", "value": "(A) basin" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895868_107570773733541_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, remote (highlighted by a red box) or remote (highlighted by a blue box)?\n(A) remote\n(B) remote" }, { "from": "gpt", "value": "(B) remote" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899913_1028332854259333_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is bathrobe (annotated by the red box) located relative to curtain?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898587_184449778703125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of pillow (annotated by the red box) in relation to chair?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898236_167730724630125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, picture frame (highlighted by a red box) or remote control (highlighted by a blue box)?\n(A) picture frame\n(B) remote control" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649707_47765754332166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, window screen (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) window screen\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261167_1330261217750_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from door (highlighted by a red box), chair (highlighted by a blue box) or radiator (highlighted by a green box)?\n(A) chair\n(B) radiator" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899898_1027058731105875_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to window (highlighted by a red box)? Choose from furniture (highlighted by a blue box) and blind (highlighted by a green box).\n(A) furniture\n(B) blind" }, { "from": "gpt", "value": "(B) blind" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458286_76238031522541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from cabinetry (highlighted by a red box)? curtain (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) curtain\n(B) chair" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670158_40735942399833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, cabinetry (highlighted by a red box) or floral arrangement (highlighted by a blue box)?\n(A) cabinetry\n(B) floral arrangement" }, { "from": "gpt", "value": "(B) floral arrangement" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898701_580969986329625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, countertop (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) countertop\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649720_47932951496166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, bed (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) bed\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018746_7246756922208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, appliance (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895274_79080915176333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the book (highlighted by a red box)? book (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) book\n(B) cabinetry" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739313_44860010362458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, fireplace (highlighted by a red box) or chest of drawers (highlighted by a blue box)?\n(A) fireplace\n(B) chest of drawers" }, { "from": "gpt", "value": "(B) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358253_6203043132708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, book (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) book\n(B) basket" }, { "from": "gpt", "value": "(B) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899936_863329469012750_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896031_129145828114416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to studio couch (highlighted by a red box)? curtain (highlighted by a blue box) or plain (highlighted by a green box).\n(A) curtain\n(B) plain" }, { "from": "gpt", "value": "(B) plain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334487_104569624102208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, footwear (highlighted by a red box) or footwear (highlighted by a blue box)?\n(A) footwear\n(B) footwear" }, { "from": "gpt", "value": "(B) footwear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669880_11262306994250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, bar stool (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) bar stool\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739821_16242189978083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, bed (highlighted by a red box) or fireplace (highlighted by a blue box)?\n(A) bed\n(B) fireplace" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828476_100625052464125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, picture frame (highlighted by a red box) or book (highlighted by a blue box)?\n(A) picture frame\n(B) book" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898720_582956273028208_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to mirror (highlighted by a red box)? radiator (highlighted by a blue box) or door (highlighted by a green box).\n(A) radiator\n(B) door" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739600_199500486118000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, table lamp (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) table lamp\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446574_86372073588666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from chair (highlighted by a red box)? houseplant (highlighted by a blue box) or path (highlighted by a green box)?\n(A) houseplant\n(B) path" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115358_4221801410958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chandelier (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) chandelier\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899477_954243527996250_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to picture frame (highlighted by a red box)? lamp (highlighted by a blue box) or mirror (highlighted by a green box).\n(A) lamp\n(B) mirror" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334733_535857432191250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, chair (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) chair\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334464_100898685152208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, electric outlet (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) electric outlet\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332810_48142330856833_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from kitchen knife (highlighted by a red box)? Choose among these: kitchen knife (highlighted by a blue box) or countertop (highlighted by a green box).\n(A) kitchen knife\n(B) countertop" }, { "from": "gpt", "value": "(B) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429799_737864531616791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, door (highlighted by a red box) or design (highlighted by a blue box)?\n(A) door\n(B) design" }, { "from": "gpt", "value": "(B) design" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332075_251523430755541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, counter top (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) counter top\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115205_95113828198458_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to tablet computer (highlighted by a red box)? Choose from cloth (highlighted by a blue box) and electric outlet (highlighted by a green box).\n(A) cloth\n(B) electric outlet" }, { "from": "gpt", "value": "(A) cloth" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899284_885326352494916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from window (highlighted by a red box)? Select from counter top (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) counter top\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896055_131933196613000_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the table (highlighted by a red box)? alcohol (highlighted by a blue box) or chair (highlighted by a green box).\n(A) alcohol\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430269_185589618645166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, cupboard (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) cupboard\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334057_86292890047750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331187_278083195038291_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333785_48860573193583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, houseplant (highlighted by a red box) or refrigerator (highlighted by a blue box)?\n(A) houseplant\n(B) refrigerator" }, { "from": "gpt", "value": "(B) refrigerator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739563_198334154206375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, sink (highlighted by a red box) or home appliance (highlighted by a blue box)?\n(A) sink\n(B) home appliance" }, { "from": "gpt", "value": "(B) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334559_68602629405625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from window screen (highlighted by a red box)? Select from computer keyboard (highlighted by a blue box) and computer monitor (highlighted by a green box).\n(A) computer keyboard\n(B) computer monitor" }, { "from": "gpt", "value": "(A) computer keyboard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446588_206025142930458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, mechanical fan (highlighted by a red box) or blanket (highlighted by a blue box)?\n(A) mechanical fan\n(B) blanket" }, { "from": "gpt", "value": "(B) blanket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444887_102501993576875_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444738_77948401499625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, chest of drawers (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chest of drawers\n(B) chair" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896205_2100284751540_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from door (highlighted by a red box)? Choose from cabinetry (highlighted by a blue box) and door (highlighted by a green box).\n(A) cabinetry\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204305_15364280252875_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to studio couch (highlighted by a red box), plaid (highlighted by a blue box) or studio couch (highlighted by a green box)?\n(A) plaid\n(B) studio couch" }, { "from": "gpt", "value": "(A) plaid" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261344_24165349651208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chair (highlighted by a red box) or armchair (highlighted by a blue box)?\n(A) chair\n(B) armchair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895912_111393951123750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, bottle (highlighted by a red box) or rail (highlighted by a blue box)?\n(A) bottle\n(B) rail" }, { "from": "gpt", "value": "(B) rail" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796466_3723802268208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of toilet (annotated by the red box) and cleaning product in the image provided, where is toilet (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649722_48873708972500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, window (highlighted by a red box) or window (highlighted by a blue box)?\n(A) window\n(B) window" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458366_100784551271666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the curtain (highlighted by a red box)? television (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) television\n(B) picture frame" }, { "from": "gpt", "value": "(A) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458202_74813071413625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from picture frame (highlighted by a red box), book (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) book\n(B) picture frame" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828340_78855434956666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from radiator (highlighted by a red box)? Choose from pillow (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204921_3704989957166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, lamp (highlighted by a red box) or dark (highlighted by a blue box)?\n(A) lamp\n(B) dark" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204376_18255724764791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, houseplant (highlighted by a red box) or window frame (highlighted by a blue box)?\n(A) houseplant\n(B) window frame" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896063_131998987249583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from bottle (highlighted by a red box), bottle (highlighted by a blue box) or bottle (highlighted by a green box)?\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897467_471593814668916_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to chair (highlighted by a red box)? Choose from cabinetry (highlighted by a blue box) and window screen (highlighted by a green box).\n(A) cabinetry\n(B) window screen" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358362_16230162903583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, person (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) person\n(B) furniture" }, { "from": "gpt", "value": "(A) person" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333665_131877900640957_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, toy (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332758_43221331391500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, cleaning product (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) cleaning product\n(B) toiletry" }, { "from": "gpt", "value": "(A) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261096_1210454147500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, sink (highlighted by a red box) or apple (highlighted by a blue box)?\n(A) sink\n(B) apple" }, { "from": "gpt", "value": "(B) apple" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899498_197881543443541_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739301_43617268499041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, appliance (highlighted by a red box) or faucet (highlighted by a blue box)?\n(A) appliance\n(B) faucet" }, { "from": "gpt", "value": "(B) faucet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458633_127536276490708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, basket (highlighted by a red box) or footwear (highlighted by a blue box)?\n(A) basket\n(B) footwear" }, { "from": "gpt", "value": "(A) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896351_18718905407166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, picture frame (highlighted by a red box) or television (highlighted by a blue box)?\n(A) picture frame\n(B) television" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115427_4887614905416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from light fixture (highlighted by a red box)? Choose among these: window (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) window\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332696_107006295215833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, table (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) table\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796562_15986478530041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the paper towel (highlighted by a red box)? electric outlet (highlighted by a blue box) or loudspeaker (highlighted by a green box).\n(A) electric outlet\n(B) loudspeaker" }, { "from": "gpt", "value": "(A) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649707_47743746798916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is toaster (annotated by the red box) located in relation to kitchen appliance in the image? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115217_94920742166583_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333778_48255630726041_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to basket (highlighted by a red box)? box (highlighted by a blue box) or box (highlighted by a green box).\n(A) box\n(B) box" }, { "from": "gpt", "value": "(A) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430092_28738177182958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhere is toy (annotated by the red box) located in relation to toy in the image?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899953_865675652522333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, drawer (highlighted by a red box) or equipment (highlighted by a blue box)?\n(A) drawer\n(B) equipment" }, { "from": "gpt", "value": "(A) drawer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204864_2774159833000_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from radiator (highlighted by a red box)? appliance (highlighted by a blue box) or appliance (highlighted by a green box)?\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429721_18044745730833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, cabinetry (highlighted by a red box) or washing machine (highlighted by a blue box)?\n(A) cabinetry\n(B) washing machine" }, { "from": "gpt", "value": "(B) washing machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333840_54026880463375_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from door (highlighted by a red box), laundry (highlighted by a blue box) or furniture (highlighted by a green box)?\n(A) laundry\n(B) furniture" }, { "from": "gpt", "value": "(A) laundry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446050_79836957507250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, furniture (highlighted by a red box) or trash bin/can (highlighted by a blue box)?\n(A) furniture\n(B) trash bin/can" }, { "from": "gpt", "value": "(B) trash bin/can" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333110_108851191627166_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the table (highlighted by a red box)? chair (highlighted by a blue box) or paperback book (highlighted by a green box).\n(A) chair\n(B) paperback book" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663065_38381992125791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, dog (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) dog\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429822_744777299056333_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, television (highlighted by a red box) or armchair (highlighted by a blue box)?\n(A) television\n(B) armchair" }, { "from": "gpt", "value": "(A) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446142_140976765074000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, chair (highlighted by a red box) or stool (highlighted by a blue box)?\n(A) chair\n(B) stool" }, { "from": "gpt", "value": "(B) stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669881_10994912990333_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, studio couch (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) studio couch\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204739_24133843038375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from curtain (highlighted by a red box)? window sill (highlighted by a blue box) or curtain (highlighted by a green box)?\n(A) window sill\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896429_19224442503625_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from window sill (highlighted by a red box), chest of drawers (highlighted by a blue box) or bed (highlighted by a green box)?\n(A) chest of drawers\n(B) bed" }, { "from": "gpt", "value": "(B) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204392_22940084749500_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from toy (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and parrot (highlighted by a green box).\n(A) picture frame\n(B) parrot" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897712_112131295048125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, radiator (highlighted by a red box) or ceramic tile (highlighted by a blue box)?\n(A) radiator\n(B) ceramic tile" }, { "from": "gpt", "value": "(B) ceramic tile" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204656_10849765677541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, home appliance (highlighted by a red box) or glass door (highlighted by a blue box)?\n(A) home appliance\n(B) glass door" }, { "from": "gpt", "value": "(A) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898687_577221415307125_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333233_32399974904333_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430978_101860532577750_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, table (highlighted by a red box) or magazine (highlighted by a blue box)?\n(A) table\n(B) magazine" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444789_50565400890458_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, cabinetry (highlighted by a red box) or microwave oven (highlighted by a blue box)?\n(A) cabinetry\n(B) microwave oven" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204585_578520411791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, footwear (highlighted by a red box) or door (highlighted by a blue box)?\n(A) footwear\n(B) door" }, { "from": "gpt", "value": "(A) footwear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662891_19499497155000_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from shop window (highlighted by a red box)? Choose among these: screen door (highlighted by a blue box) or cardboard box (highlighted by a green box).\n(A) screen door\n(B) cardboard box" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358698_3068715523750_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to coffee table (highlighted by a red box), studio couch (highlighted by a blue box) or studio couch (highlighted by a green box)?\n(A) studio couch\n(B) studio couch" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115574_2505203809833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, desk (highlighted by a red box) or door (highlighted by a blue box)?\n(A) desk\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334213_105747295879375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, lamp (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) lamp\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649647_40338927042083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from mouthwash (highlighted by a red box)? toothbrush (highlighted by a blue box) or mirror (highlighted by a green box)?\n(A) toothbrush\n(B) mirror" }, { "from": "gpt", "value": "(B) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358340_15279319222875_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to chair (highlighted by a red box), paper towel (highlighted by a blue box) or appliance (highlighted by a green box)?\n(A) paper towel\n(B) appliance" }, { "from": "gpt", "value": "(A) paper towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458717_137701103972000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, curtain (highlighted by a red box) or bathtub (highlighted by a blue box)?\n(A) curtain\n(B) bathtub" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260957_5950296027583_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, table (highlighted by a red box) or door (highlighted by a blue box)?\n(A) table\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898510_160651689646375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, bookcase (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) bookcase\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430314_264803044803750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, furniture (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) furniture\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331232_283359727495541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from toiletry (highlighted by a red box)? Choose among these: mirror (highlighted by a blue box) or balustrade (highlighted by a green box).\n(A) mirror\n(B) balustrade" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897512_472710502310041_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the cabinetry (highlighted by a red box)? Choose among these: storage box (highlighted by a blue box) or storage box (highlighted by a green box).\n(A) storage box\n(B) storage box" }, { "from": "gpt", "value": "(A) storage box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204322_15976059123208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, mirror (highlighted by a red box) or glass door (highlighted by a blue box)?\n(A) mirror\n(B) glass door" }, { "from": "gpt", "value": "(B) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444872_98060177651291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, toy (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446462_354234433185875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, curtain (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) curtain\n(B) chair" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896395_22728263365875_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the oil lamp (highlighted by a red box)? nightstand (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) nightstand\n(B) pillow" }, { "from": "gpt", "value": "(A) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333031_59044929276791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, coffee table (highlighted by a red box) or couple (highlighted by a blue box)?\n(A) coffee table\n(B) couple" }, { "from": "gpt", "value": "(A) coffee table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358362_16162156593583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to chest of drawers (highlighted by a red box), chair (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430599_315408320753416_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to speaker (highlighted by a red box)? desk (highlighted by a blue box) or shelf (highlighted by a green box).\n(A) desk\n(B) shelf" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663330_77393871408875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, door (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) door\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260938_4970195507291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, table (highlighted by a red box) or bowl (highlighted by a blue box)?\n(A) table\n(B) bowl" }, { "from": "gpt", "value": "(B) bowl" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446479_355576757801666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is swivel chair (annotated by the red box) located in relation to pillow in the image? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796562_15974483496375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from swivel chair (highlighted by a red box)? Choose from table (highlighted by a blue box) and chair (highlighted by a green box).\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895591_1161456580986208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, exhaust hood (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) exhaust hood\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895465_130587214148083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from gas stove (highlighted by a red box), blanket (highlighted by a blue box) or oven (highlighted by a green box)?\n(A) blanket\n(B) oven" }, { "from": "gpt", "value": "(A) blanket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333233_32325471561541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhere is furniture (annotated by the red box) located in relation to luggage and bags in the image?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333561_200731776359583_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, washing machine (highlighted by a red box) or laundry (highlighted by a blue box)?\n(A) washing machine\n(B) laundry" }, { "from": "gpt", "value": "(A) washing machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334074_88942773634791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, mirror (highlighted by a red box) or face powder (highlighted by a blue box)?\n(A) mirror\n(B) face powder" }, { "from": "gpt", "value": "(B) face powder" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649743_49715897393541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, filing cabinet (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) filing cabinet\n(B) table lamp" }, { "from": "gpt", "value": "(A) filing cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445597_284964732981458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chest of drawers (highlighted by a red box) or plain (highlighted by a blue box)?\n(A) chest of drawers\n(B) plain" }, { "from": "gpt", "value": "(B) plain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47431136_351148772785291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of toy (annotated by the red box) in reference to toy? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334066_87340616581875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to glass jar (highlighted by a red box), product (highlighted by a blue box) or cleaning product (highlighted by a green box)?\n(A) product\n(B) cleaning product" }, { "from": "gpt", "value": "(B) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796464_3570599040250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, medicine cabinet (highlighted by a red box) or bathtub (highlighted by a blue box)?\n(A) medicine cabinet\n(B) bathtub" }, { "from": "gpt", "value": "(A) medicine cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018817_20129047444208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, sink (highlighted by a red box) or toilet (highlighted by a blue box)?\n(A) sink\n(B) toilet" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662951_24355229952041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from pillow (highlighted by a red box), pillow (highlighted by a blue box) or shoe (highlighted by a green box)?\n(A) pillow\n(B) shoe" }, { "from": "gpt", "value": "(B) shoe" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334938_663153289940083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chair (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) chair\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445639_58324769746916_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from chest of drawers (highlighted by a red box)? Choose from table lamp (highlighted by a blue box) and nightstand (highlighted by a green box).\n(A) table lamp\n(B) nightstand" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796505_3380419233666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to bookshelf (highlighted by a red box), picture frame (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458607_125627591132583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, light fixture (highlighted by a red box) or bathrobe (highlighted by a blue box)?\n(A) light fixture\n(B) bathrobe" }, { "from": "gpt", "value": "(A) light fixture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430844_70994746811208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, bathtub (highlighted by a red box) or window (highlighted by a blue box)?\n(A) bathtub\n(B) window" }, { "from": "gpt", "value": "(A) bathtub" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429799_737826330384875_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from wood (highlighted by a red box)? screen door (highlighted by a blue box) or radiator (highlighted by a green box)?\n(A) screen door\n(B) radiator" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896587_32931240813416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, door (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) door\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896101_145171204589583_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from chest of drawers (highlighted by a red box)? Choose from speaker (highlighted by a blue box) and television (highlighted by a green box).\n(A) speaker\n(B) television" }, { "from": "gpt", "value": "(A) speaker" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670053_33978854840624_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is bathroom cabinet (annotated by the red box) located relative to sink? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334849_615479344937125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, cabinetry (highlighted by a red box) or soap dispenser (highlighted by a blue box)?\n(A) cabinetry\n(B) soap dispenser" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895245_75748783942916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, book (highlighted by a red box) or paperback book (highlighted by a blue box)?\n(A) book\n(B) paperback book" }, { "from": "gpt", "value": "(B) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261515_43667838305083_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115504_12326320558500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, bookcase (highlighted by a red box) or swivel chair (highlighted by a blue box)?\n(A) bookcase\n(B) swivel chair" }, { "from": "gpt", "value": "(B) swivel chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444499_2463112498583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, picture frame (highlighted by a red box) or window (highlighted by a blue box)?\n(A) picture frame\n(B) window" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896365_19919840505583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the window (highlighted by a red box)? coffee maker (highlighted by a blue box) or electric outlet (highlighted by a green box).\n(A) coffee maker\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444733_78047993879666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, box (highlighted by a red box) or animal (highlighted by a blue box)?\n(A) box\n(B) animal" }, { "from": "gpt", "value": "(B) animal" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331909_627494472729625_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, door (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) door\n(B) screen door" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796366_10592446400333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, picture frame (highlighted by a red box) or computer keyboard (highlighted by a blue box)?\n(A) picture frame\n(B) computer keyboard" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899654_233414279776166_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the stationary bicycle (highlighted by a red box)? Choose among these: curtain (highlighted by a blue box) or curtain (highlighted by a green box).\n(A) curtain\n(B) curtain" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896117_145976516191666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, chest of drawers (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) chest of drawers\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115415_4121960771082_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, pillow (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) pillow\n(B) mat" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358624_431307137583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, screen door (highlighted by a red box) or footwear (highlighted by a blue box)?\n(A) screen door\n(B) footwear" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429884_367778129115291_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from open (highlighted by a red box)? cabinetry (highlighted by a blue box) or radiator (highlighted by a green box)?\n(A) cabinetry\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204303_14979573485375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the bowl (highlighted by a red box)? curtain (highlighted by a blue box) or chair (highlighted by a green box).\n(A) curtain\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669881_11006908242625_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from cabinetry (highlighted by a red box)? Choose among these: chair (highlighted by a blue box) or chair (highlighted by a green box).\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332648_369079267288625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to computer keyboard (highlighted by a red box), houseplant (highlighted by a blue box) or desk (highlighted by a green box)?\n(A) houseplant\n(B) desk" }, { "from": "gpt", "value": "(B) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669939_15270939044083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, cocktail table (highlighted by a red box) or blind (highlighted by a blue box)?\n(A) cocktail table\n(B) blind" }, { "from": "gpt", "value": "(A) cocktail table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458451_118244527795250_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from window (highlighted by a red box)? Choose from curtain (highlighted by a blue box) and desk (highlighted by a green box).\n(A) curtain\n(B) desk" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018071_98167378116666_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, bathtub (highlighted by a red box) or bath mat (highlighted by a blue box)?\n(A) bathtub\n(B) bath mat" }, { "from": "gpt", "value": "(B) bath mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649807_46781389465166_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from picture frame (highlighted by a red box)? Choose from cabinetry (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) cabinetry\n(B) picture frame" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115416_4073763158750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, coffee table (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) coffee table\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332400_405814768378333_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, table (highlighted by a red box) or refrigerator (highlighted by a blue box)?\n(A) table\n(B) refrigerator" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204304_15104171836375_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the desk (highlighted by a red box)? Choose among these: houseplant (highlighted by a blue box) or bay window (highlighted by a green box).\n(A) houseplant\n(B) bay window" }, { "from": "gpt", "value": "(B) bay window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115504_12258314123833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, table (highlighted by a red box) or book (highlighted by a blue box)?\n(A) table\n(B) book" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331220_282481911891666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, screen door (highlighted by a red box) or mirror (highlighted by a blue box)?\n(A) screen door\n(B) mirror" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334627_386295830347166_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739919_16209969729041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is chest of drawers (annotated by the red box) located relative to drawer? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445697_62771802935958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, lamp (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) lamp\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739275_42662861900750_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from chair (highlighted by a red box), window screen (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) window screen\n(B) chair" }, { "from": "gpt", "value": "(A) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739931_16615710974416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, toilet (highlighted by a red box) or sink (highlighted by a blue box)?\n(A) toilet\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739329_45581717581916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, window sill (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) window sill\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261206_11668478592250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, nightstand (highlighted by a red box) or footwear (highlighted by a blue box)?\n(A) nightstand\n(B) footwear" }, { "from": "gpt", "value": "(B) footwear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669880_11188303035958_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to appliance (highlighted by a red box), appliance (highlighted by a blue box) or kitchen appliance (highlighted by a green box)?\n(A) appliance\n(B) kitchen appliance" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204786_27323572540166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430287_186526872609625_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446485_355920350625250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, chair (highlighted by a red box) or table (highlighted by a blue box)?\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445841_69180352487540_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, shelf (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) shelf\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430924_93048075142208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, writing desk (highlighted by a red box) or person (highlighted by a blue box)?\n(A) writing desk\n(B) person" }, { "from": "gpt", "value": "(A) writing desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899030_643007077162833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the fabric (highlighted by a red box)? chair (highlighted by a blue box) or chair (highlighted by a green box).\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331049_482452823425125_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from furniture (highlighted by a red box)? door (highlighted by a blue box) or door (highlighted by a green box)?\n(A) door\n(B) door" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445790_67197608807458_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from dirt (highlighted by a red box)? glass door (highlighted by a blue box) or door (highlighted by a green box)?\n(A) glass door\n(B) door" }, { "from": "gpt", "value": "(A) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445954_129838457612625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, studio couch (highlighted by a red box) or dresser (highlighted by a blue box)?\n(A) studio couch\n(B) dresser" }, { "from": "gpt", "value": "(B) dresser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458561_128045224444125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, door (highlighted by a red box) or hardwood (highlighted by a blue box)?\n(A) door\n(B) hardwood" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429753_355350991950750_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to picture frame (highlighted by a red box)? Choose from book (highlighted by a blue box) and table (highlighted by a green box).\n(A) book\n(B) table" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333624_77205660062416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, bed frame (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) bed frame\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018415_394365220350250_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to table (highlighted by a red box)? Select from wide (highlighted by a blue box) and wrapping paper (highlighted by a green box).\n(A) wide\n(B) wrapping paper" }, { "from": "gpt", "value": "(A) wide" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895249_75822087227166_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to stool (highlighted by a red box), mat (highlighted by a blue box) or desk (highlighted by a green box)?\n(A) mat\n(B) desk" }, { "from": "gpt", "value": "(A) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018508_530446799875958_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, faucet (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) faucet\n(B) toiletry" }, { "from": "gpt", "value": "(A) faucet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796438_692613093041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, picture frame (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) picture frame\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445736_64093493822500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, toaster (highlighted by a red box) or counter (highlighted by a blue box)?\n(A) toaster\n(B) counter" }, { "from": "gpt", "value": "(B) counter" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333812_52177754538625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, round table (highlighted by a red box) or keyboard (highlighted by a blue box)?\n(A) round table\n(B) keyboard" }, { "from": "gpt", "value": "(A) round table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261357_25844225511833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, washing machine (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) washing machine\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332113_684346007613083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, tap (highlighted by a red box) or cleaning product (highlighted by a blue box)?\n(A) tap\n(B) cleaning product" }, { "from": "gpt", "value": "(A) tap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670075_38521503180375_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears farthest from the camera in this image?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898261_696805033897625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the computer (highlighted by a red box)? Choose among these: computer keyboard (highlighted by a blue box) or desk (highlighted by a green box).\n(A) computer keyboard\n(B) desk" }, { "from": "gpt", "value": "(A) computer keyboard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261666_2570948776125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, basket (highlighted by a red box) or brush (highlighted by a blue box)?\n(A) basket\n(B) brush" }, { "from": "gpt", "value": "(A) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899630_229919273134375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is appliance (annotated by the red box) located relative to electric outlet? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358173_62457029457000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is floral arrangement (annotated by the red box) located in relation to lamp in the image? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895577_1155258153289166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, towel bar (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) towel bar\n(B) toiletry" }, { "from": "gpt", "value": "(A) towel bar" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828439_90625936335541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from tap (highlighted by a red box)? Choose among these: home appliance (highlighted by a blue box) or window (highlighted by a green box).\n(A) home appliance\n(B) window" }, { "from": "gpt", "value": "(A) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458706_136824459998250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, electric outlet (highlighted by a red box) or fridge (highlighted by a blue box)?\n(A) electric outlet\n(B) fridge" }, { "from": "gpt", "value": "(A) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332467_886376772838458_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from shelf (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670288_62098317256458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, cabinetry (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) cabinetry\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896133_147127414196000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chair (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) chair\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458330_103007712709708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from table (highlighted by a red box)? Select from side table (highlighted by a blue box) and mat (highlighted by a green box).\n(A) side table\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115448_11736251052125_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to bag (highlighted by a red box)? Choose from furniture (highlighted by a blue box) and window (highlighted by a green box).\n(A) furniture\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458506_113212671101125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, shelf (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) shelf\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333308_28019344483291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, kitchen appliance (highlighted by a red box) or kitchen appliance (highlighted by a blue box)?\n(A) kitchen appliance\n(B) kitchen appliance" }, { "from": "gpt", "value": "(A) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662835_15850652478000_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the picture frame (highlighted by a red box)? floral arrangement (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) floral arrangement\n(B) picture frame" }, { "from": "gpt", "value": "(A) floral arrangement" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897945_351496703862291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of electric outlet (annotated by the red box) in relation to furniture?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334024_271720791872708_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739749_4263494756166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, bath towel (highlighted by a red box) or tap (highlighted by a blue box)?\n(A) bath towel\n(B) tap" }, { "from": "gpt", "value": "(B) tap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204474_25049584151958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, lamp (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) lamp\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429822_744680705198916_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from houseplant (highlighted by a red box)? Choose from pillow (highlighted by a blue box) and bedside lamp (highlighted by a green box).\n(A) pillow\n(B) bedside lamp" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899573_959584535206583_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332075_251523430755541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from mouthwash (highlighted by a red box)? bottle (highlighted by a blue box) or toilet paper (highlighted by a green box)?\n(A) bottle\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828449_91307225169291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the lamp (highlighted by a red box)? Choose among these: picture frame (highlighted by a blue box) or lighting (highlighted by a green box).\n(A) picture frame\n(B) lighting" }, { "from": "gpt", "value": "(B) lighting" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739425_191758304232833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to flower (highlighted by a red box)? plant (highlighted by a blue box) or flower (highlighted by a green box).\n(A) plant\n(B) flower" }, { "from": "gpt", "value": "(B) flower" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896083_144045900898583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, picture frame (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) picture frame\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896404_16673220210832_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, window (highlighted by a red box) or beach towel (highlighted by a blue box)?\n(A) window\n(B) beach towel" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898195_145230912344208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of door (annotated by the red box) in reference to radiator? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333293_26474627060791_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from stairs (highlighted by a red box)? ladder (highlighted by a blue box) or mirror (highlighted by a green box)?\n(A) ladder\n(B) mirror" }, { "from": "gpt", "value": "(B) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796744_28926079163250_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897757_117787218165833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, book (highlighted by a red box) or table (highlighted by a blue box)?\n(A) book\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447203_88049079194125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, book (highlighted by a red box) or table (highlighted by a blue box)?\n(A) book\n(B) table" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458366_100806542576083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, picture frame (highlighted by a red box) or television (highlighted by a blue box)?\n(A) picture frame\n(B) television" }, { "from": "gpt", "value": "(B) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018339_117070911625166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, bookshelf (highlighted by a red box) or book (highlighted by a blue box)?\n(A) bookshelf\n(B) book" }, { "from": "gpt", "value": "(A) bookshelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898622_757627108810291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, toiletry (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) toiletry\n(B) toiletry" }, { "from": "gpt", "value": "(B) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897560_473362893579666_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896063_132129002427500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to refrigerator (highlighted by a red box)? Select from cabinetry (highlighted by a blue box) and toilet paper (highlighted by a green box).\n(A) cabinetry\n(B) toilet paper" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018119_368557036402583_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from utensil (highlighted by a red box)? utensil (highlighted by a blue box) or appliance (highlighted by a green box)?\n(A) utensil\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895895_109456112284541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to toiletry (highlighted by a red box)? Select from basin (highlighted by a blue box) and basin (highlighted by a green box).\n(A) basin\n(B) basin" }, { "from": "gpt", "value": "(B) basin" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204322_16054060077125_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898723_582898080279875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, table lamp (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) table lamp\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331934_163607785882916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, waste (highlighted by a red box) or waste (highlighted by a blue box)?\n(A) waste\n(B) waste" }, { "from": "gpt", "value": "(B) waste" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333838_54222767576000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, toy (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828478_100824753055375_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to screen door (highlighted by a red box)? towel/napkin (highlighted by a blue box) or radiator (highlighted by a green box).\n(A) towel/napkin\n(B) radiator" }, { "from": "gpt", "value": "(A) towel/napkin" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018273_794972071650375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, lamp (highlighted by a red box) or window (highlighted by a blue box)?\n(A) lamp\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334274_157021469129583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from paper plate (highlighted by a red box)? Select from table (highlighted by a blue box) and platter (highlighted by a green box).\n(A) table\n(B) platter" }, { "from": "gpt", "value": "(B) platter" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897512_472748503285791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from toilet paper (highlighted by a red box)? handbag (highlighted by a blue box) or storage box (highlighted by a green box)?\n(A) handbag\n(B) storage box" }, { "from": "gpt", "value": "(A) handbag" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333035_58743234864375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, clothing (highlighted by a red box) or clothing (highlighted by a blue box)?\n(A) clothing\n(B) clothing" }, { "from": "gpt", "value": "(B) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899955_865608863555083_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899900_1026966035836666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, animal (highlighted by a red box) or bay window (highlighted by a blue box)?\n(A) animal\n(B) bay window" }, { "from": "gpt", "value": "(B) bay window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649474_14688626856000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, book (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) book\n(B) pillow" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332066_250010179954208_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the table (highlighted by a red box)? mat (highlighted by a blue box) or waste container (highlighted by a green box).\n(A) mat\n(B) waste container" }, { "from": "gpt", "value": "(B) waste container" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332156_260011835600625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chair (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) chair\n(B) shelf" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334130_140736368233708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, cleaning product (highlighted by a red box) or soap (highlighted by a blue box)?\n(A) cleaning product\n(B) soap" }, { "from": "gpt", "value": "(B) soap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796190_386331816333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from bed (highlighted by a red box)? table (highlighted by a blue box) or bottle (highlighted by a green box)?\n(A) table\n(B) bottle" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444907_106182052163250_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to coffeepot (highlighted by a red box), counter top (highlighted by a blue box) or light switch (highlighted by a green box)?\n(A) counter top\n(B) light switch" }, { "from": "gpt", "value": "(A) counter top" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018524_821509998361333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from pillow (highlighted by a red box)? Choose from bed (highlighted by a blue box) and nightstand (highlighted by a green box).\n(A) bed\n(B) nightstand" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430808_64044303567625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from picture frame (highlighted by a red box)? Choose among these: door (highlighted by a blue box) or dresser (highlighted by a green box).\n(A) door\n(B) dresser" }, { "from": "gpt", "value": "(B) dresser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430646_323683502357166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhere is desk (annotated by the red box) located in relation to curtain in the image?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261502_42590377456958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the nightstand (highlighted by a red box)? bed (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) bed\n(B) picture frame" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899271_883795096758166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, bath (highlighted by a red box) or cleaning product (highlighted by a blue box)?\n(A) bath\n(B) cleaning product" }, { "from": "gpt", "value": "(B) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47431041_141736061656708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, lamp (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) lamp\n(B) window sill" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204535_2164336874041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, curtain (highlighted by a red box) or stool (highlighted by a blue box)?\n(A) curtain\n(B) stool" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458262_74167148233458_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the wide (highlighted by a red box)? Choose among these: book (highlighted by a blue box) or window screen (highlighted by a green box).\n(A) book\n(B) window screen" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670150_40457635849416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, chair (highlighted by a red box) or table (highlighted by a blue box)?\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458561_128039226930416_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from counter (highlighted by a red box)? Choose among these: door (highlighted by a blue box) or door (highlighted by a green box).\n(A) door\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334672_391438109208000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, furniture (highlighted by a red box) or table (highlighted by a blue box)?\n(A) furniture\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896404_16679217824791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, washing machine (highlighted by a red box) or water heater (highlighted by a blue box)?\n(A) washing machine\n(B) water heater" }, { "from": "gpt", "value": "(B) water heater" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670063_37895521701625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from window (highlighted by a red box)? Select from table (highlighted by a blue box) and window (highlighted by a green box).\n(A) table\n(B) window" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261263_13904007766666_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of window (annotated by the red box) and shower in the image provided, where is window (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669934_14888189281000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, drawer (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) drawer\n(B) furniture" }, { "from": "gpt", "value": "(A) drawer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796684_30829147805416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, computer monitor (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) computer monitor\n(B) appliance" }, { "from": "gpt", "value": "(A) computer monitor" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204656_10826374930875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of picture frame (annotated by the red box) and light switch in the image provided, where is picture frame (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898448_3326385096250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, corridor (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) corridor\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895912_111388536704125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from hand towel (highlighted by a red box)? tap (highlighted by a blue box) or cleaning product (highlighted by a green box)?\n(A) tap\n(B) cleaning product" }, { "from": "gpt", "value": "(B) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018090_104089726618541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, mouthwash (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) mouthwash\n(B) toiletry" }, { "from": "gpt", "value": "(B) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332748_42538411213791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from radiator (highlighted by a red box)? door (highlighted by a blue box) or electric outlet (highlighted by a green box)?\n(A) door\n(B) electric outlet" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334037_278546722588666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to table (highlighted by a red box)? book (highlighted by a blue box) or houseplant (highlighted by a green box).\n(A) book\n(B) houseplant" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331432_546061418508374_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, piggy bank (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) piggy bank\n(B) furniture" }, { "from": "gpt", "value": "(A) piggy bank" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895469_132719013854041_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333329_30131520432416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the toiletry (highlighted by a red box)? Choose among these: mouthwash (highlighted by a blue box) or cleaning product (highlighted by a green box).\n(A) mouthwash\n(B) cleaning product" }, { "from": "gpt", "value": "(A) mouthwash" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115283_118242731093916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, stool (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) stool\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358105_61795497361833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from animal (highlighted by a red box)? shelf (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) shelf\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48017828_696926665527625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, appliance (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) appliance\n(B) radiator" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828390_94739404249750_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, pillow (highlighted by a red box) or glass door (highlighted by a blue box)?\n(A) pillow\n(B) glass door" }, { "from": "gpt", "value": "(B) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333283_25437430640166_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from picture frame (highlighted by a red box), picture frame (highlighted by a blue box) or bed (highlighted by a green box)?\n(A) picture frame\n(B) bed" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261662_2453963885625_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, sink (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) sink\n(B) basket" }, { "from": "gpt", "value": "(B) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458714_137767494368332_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, door (highlighted by a red box) or ceramic tile (highlighted by a blue box)?\n(A) door\n(B) ceramic tile" }, { "from": "gpt", "value": "(B) ceramic tile" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896133_147068721873291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, wall clock (highlighted by a red box) or window (highlighted by a blue box)?\n(A) wall clock\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899603_202416140433750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, furniture (highlighted by a red box) or footprint (highlighted by a blue box)?\n(A) furniture\n(B) footprint" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895245_75750783123125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of picture frame (annotated by the red box) and bed in the image provided, where is picture frame (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332557_904970573789041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to coffee cup (highlighted by a red box)? Select from bottle (highlighted by a blue box) and toiletry (highlighted by a green box).\n(A) bottle\n(B) toiletry" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358406_40723374708833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, washing machine (highlighted by a red box) or counter top (highlighted by a blue box)?\n(A) washing machine\n(B) counter top" }, { "from": "gpt", "value": "(A) washing machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899057_647052786320000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is furniture (annotated by the red box) located relative to studio couch?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332473_886532176836250_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears farthest from the camera in this image?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358118_62519285119333_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from pillow (highlighted by a red box)? Choose from clock (highlighted by a blue box) and table (highlighted by a green box).\n(A) clock\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204786_27339565894000_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from counter top (highlighted by a red box), light fixture (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) light fixture\n(B) picture frame" }, { "from": "gpt", "value": "(A) light fixture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333828_53380650408458_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to cleaning product (highlighted by a red box)? Choose from bottle (highlighted by a blue box) and counter top (highlighted by a green box).\n(A) bottle\n(B) counter top" }, { "from": "gpt", "value": "(B) counter top" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649742_49592998501750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, table (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) table\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649634_39403950593625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, studio couch (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) studio couch\n(B) chair" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334754_421185704261583_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, houseplant (highlighted by a red box) or heater (highlighted by a blue box)?\n(A) houseplant\n(B) heater" }, { "from": "gpt", "value": "(B) heater" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332751_42639720231583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, home appliance (highlighted by a red box) or laundry (highlighted by a blue box)?\n(A) home appliance\n(B) laundry" }, { "from": "gpt", "value": "(B) laundry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332990_125273300883958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of curtain (annotated by the red box) in relation to curtain?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332184_262576115984916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, chest of drawers (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) chest of drawers\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333155_41610225919833_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444706_73266575285166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, picture frame (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) picture frame\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796521_3967209795125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, door (highlighted by a red box) or lighting (highlighted by a blue box)?\n(A) door\n(B) lighting" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331934_163593791563208_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from armchair (highlighted by a red box)? Choose among these: light fixture (highlighted by a blue box) or countertop (highlighted by a green box).\n(A) light fixture\n(B) countertop" }, { "from": "gpt", "value": "(B) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796475_4216927625958_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358289_15863055737083_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896416_17787030610250_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the table lamp (highlighted by a red box)? pillow (highlighted by a blue box) or changing table (highlighted by a green box).\n(A) pillow\n(B) changing table" }, { "from": "gpt", "value": "(B) changing table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018523_821387497996291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, houseplant (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) houseplant\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444514_3833942400291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from screen door (highlighted by a red box)? door (highlighted by a blue box) or door handle (highlighted by a green box)?\n(A) door\n(B) door handle" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898684_576356290135416_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to mirror (highlighted by a red box)? toilet paper (highlighted by a blue box) or screen door (highlighted by a green box).\n(A) toilet paper\n(B) screen door" }, { "from": "gpt", "value": "(A) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204350_15536032567166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, window frame (highlighted by a red box) or window (highlighted by a blue box)?\n(A) window frame\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649397_9465266027583_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897605_137331645215666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from door (highlighted by a red box)? window (highlighted by a blue box) or bath towel (highlighted by a green box)?\n(A) window\n(B) bath towel" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334754_421187703453083_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from couch (highlighted by a red box), pillow (highlighted by a blue box) or radiator (highlighted by a green box)?\n(A) pillow\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899202_186828882035333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from cabinetry (highlighted by a red box)? Choose from door (highlighted by a blue box) and screen door (highlighted by a green box).\n(A) door\n(B) screen door" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429766_358348249679541_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018068_98200981241208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, shelf (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) shelf\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458221_76852962263583_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896103_145336902505625_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896096_144302794318875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, door (highlighted by a red box) or door (highlighted by a blue box)?\n(A) door\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897892_345158510964208_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to flag (highlighted by a red box)? picture frame (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649639_39639436344166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, armchair (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) armchair\n(B) bottle" }, { "from": "gpt", "value": "(A) armchair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895994_136239216253583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, picture frame (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) picture frame\n(B) studio couch" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649802_46919284906416_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from table (highlighted by a red box), pillow (highlighted by a blue box) or pad (highlighted by a green box)?\n(A) pillow\n(B) pad" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430262_185409408436208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, bed (highlighted by a red box) or doormat (highlighted by a blue box)?\n(A) bed\n(B) doormat" }, { "from": "gpt", "value": "(B) doormat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899470_954162127835625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to bean bag chair (highlighted by a red box), television (highlighted by a blue box) or furniture (highlighted by a green box)?\n(A) television\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331132_174198648547708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898802_68915395562958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of chest of drawers (annotated by the red box) and computer in the image provided, where is chest of drawers (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899663_234373458281875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, poster (highlighted by a red box) or door (highlighted by a blue box)?\n(A) poster\n(B) door" }, { "from": "gpt", "value": "(A) poster" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261556_75636877101791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from toy (highlighted by a red box), toy (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) toy\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331934_163462494718291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, light switch (highlighted by a red box) or light switch (highlighted by a blue box)?\n(A) light switch\n(B) light switch" }, { "from": "gpt", "value": "(A) light switch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430251_182261978274166_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from notepad (highlighted by a red box)? Select from table (highlighted by a blue box) and mat (highlighted by a green box).\n(A) table\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358362_16200158157208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, furniture (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) furniture\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895571_1153712444279875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, picture frame (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) picture frame\n(B) lamp" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204535_2170334375250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, television (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) television\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333277_24423810001708_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, chair (highlighted by a red box) or coffee table (highlighted by a blue box)?\n(A) chair\n(B) coffee table" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358410_40632678925083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the bottle (highlighted by a red box)? Choose among these: beach towel (highlighted by a blue box) or oven (highlighted by a green box).\n(A) beach towel\n(B) oven" }, { "from": "gpt", "value": "(B) oven" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430248_182353291347125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, window (highlighted by a red box) or cupboard (highlighted by a blue box)?\n(A) window\n(B) cupboard" }, { "from": "gpt", "value": "(B) cupboard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204381_18117929268833_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the chair (highlighted by a red box)? chair (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) chair\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358647_2937843881666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, countertop (highlighted by a red box) or dish washer (highlighted by a blue box)?\n(A) countertop\n(B) dish washer" }, { "from": "gpt", "value": "(B) dish washer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896589_32971541536791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, lamp (highlighted by a red box) or tap (highlighted by a blue box)?\n(A) lamp\n(B) tap" }, { "from": "gpt", "value": "(B) tap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899030_643015173830583_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to book (highlighted by a red box)? Select from book (highlighted by a blue box) and book (highlighted by a green box).\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261390_27757267956000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, window (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) window\n(B) radiator" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333847_75022223249833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from pillow (highlighted by a red box), card game (highlighted by a blue box) or table lamp (highlighted by a green box)?\n(A) card game\n(B) table lamp" }, { "from": "gpt", "value": "(A) card game" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895633_471789503963125_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the furniture (highlighted by a red box)? cabinetry (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) cabinetry\n(B) cabinetry" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899235_880463326256291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, window blind (highlighted by a red box) or swivel chair (highlighted by a blue box)?\n(A) window blind\n(B) swivel chair" }, { "from": "gpt", "value": "(B) swivel chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333110_108853190813750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, book (highlighted by a red box) or paperback book (highlighted by a blue box)?\n(A) book\n(B) paperback book" }, { "from": "gpt", "value": "(B) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669939_15266940625500_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to radiator (highlighted by a red box), table (highlighted by a blue box) or table (highlighted by a green box)?\n(A) table\n(B) table" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331934_163532699655208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, book (highlighted by a red box) or plate (highlighted by a blue box)?\n(A) book\n(B) plate" }, { "from": "gpt", "value": "(B) plate" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895826_1219987677093208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, drawer (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) drawer\n(B) window sill" }, { "from": "gpt", "value": "(A) drawer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897979_216956167987250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, appliance (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) appliance\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896096_144118787361250_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the chair (highlighted by a red box)? Choose among these: cabinetry (highlighted by a blue box) or kitchen appliance (highlighted by a green box).\n(A) cabinetry\n(B) kitchen appliance" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333618_76335435177208_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to bottle (highlighted by a red box)? Select from bottle (highlighted by a blue box) and bottle (highlighted by a green box).\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358460_46701771042875_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to throw pillow (highlighted by a red box)? chair (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) chair\n(B) pillow" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739256_39604028221791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is screen door (annotated by the red box) located relative to laundry? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662890_19580696815833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to screen door (highlighted by a red box)? electric outlet (highlighted by a blue box) or lamp (highlighted by a green box).\n(A) electric outlet\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663064_38486500791041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from curtain (highlighted by a red box)? Select from window (highlighted by a blue box) and window (highlighted by a green box).\n(A) window\n(B) window" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898235_695683816367916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828361_80295934944041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from table lamp (highlighted by a red box)? door (highlighted by a blue box) or hanger (highlighted by a green box)?\n(A) door\n(B) hanger" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670334_66370195828915_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, chair (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) chair\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670184_51716843270500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, chair (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) chair\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899664_234691765529791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to stool (highlighted by a red box)? table (highlighted by a blue box) or window screen (highlighted by a green box).\n(A) table\n(B) window screen" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334020_271678192333041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of furniture (annotated by the red box) in reference to comic book? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662870_14574374742750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828233_69848327616583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the picture frame (highlighted by a red box)? Choose among these: toy (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) toy\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332759_43398626279708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the sink (highlighted by a red box)? toothbrush (highlighted by a blue box) or floral arrangement (highlighted by a green box).\n(A) toothbrush\n(B) floral arrangement" }, { "from": "gpt", "value": "(A) toothbrush" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828596_104190764114333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, bed (highlighted by a red box) or door (highlighted by a blue box)?\n(A) bed\n(B) door" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260957_5976302403958_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to screen door (highlighted by a red box), window (highlighted by a blue box) or lighting (highlighted by a green box)?\n(A) window\n(B) lighting" }, { "from": "gpt", "value": "(B) lighting" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663398_95012305294958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from curtain (highlighted by a red box)? Choose from window (highlighted by a blue box) and window (highlighted by a green box).\n(A) window\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332397_401430506667583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, pillow (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) pillow\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458693_135282991754416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, desk (highlighted by a red box) or table (highlighted by a blue box)?\n(A) desk\n(B) table" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333329_30095535108416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, product (highlighted by a red box) or product (highlighted by a blue box)?\n(A) product\n(B) product" }, { "from": "gpt", "value": "(A) product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018844_649829315994458_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, appliance (highlighted by a red box) or ceramic tile (highlighted by a blue box)?\n(A) appliance\n(B) ceramic tile" }, { "from": "gpt", "value": "(B) ceramic tile" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739459_51667587341375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, stool (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) stool\n(B) chair" }, { "from": "gpt", "value": "(A) stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204734_24204347123125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, nightstand (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) nightstand\n(B) table lamp" }, { "from": "gpt", "value": "(A) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331607_18487493686666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, bottle (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445691_57434193892875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from tile (highlighted by a red box)? bottle (highlighted by a blue box) or footwear (highlighted by a green box)?\n(A) bottle\n(B) footwear" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358731_6709814806041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the dresser (highlighted by a red box)? Choose among these: pillow (highlighted by a blue box) or furniture (highlighted by a green box).\n(A) pillow\n(B) furniture" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204780_27254967696333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from tile (highlighted by a red box)? Choose among these: chair (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) chair\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260872_7295552921625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, radiator (highlighted by a red box) or vase (highlighted by a blue box)?\n(A) radiator\n(B) vase" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739276_42739463476875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, curtain (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) curtain\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649586_35281129695083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, window (highlighted by a red box) or dresser (highlighted by a blue box)?\n(A) window\n(B) dresser" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332207_264591767593291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to table (highlighted by a red box), studio couch (highlighted by a blue box) or control (highlighted by a green box)?\n(A) studio couch\n(B) control" }, { "from": "gpt", "value": "(B) control" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670328_65795780942083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to chair (highlighted by a red box)? chair (highlighted by a blue box) or table (highlighted by a green box).\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358386_19294740806666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of rail (annotated by the red box) in reference to stairs? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649478_15067127048833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to chair (highlighted by a red box), furniture (highlighted by a blue box) or paperback book (highlighted by a green box)?\n(A) furniture\n(B) paperback book" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897462_470010061691708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to figurine (highlighted by a red box)? Select from desk (highlighted by a blue box) and box (highlighted by a green box).\n(A) desk\n(B) box" }, { "from": "gpt", "value": "(B) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895618_470338597617375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from bottle (highlighted by a red box)? bottle (highlighted by a blue box) or bottle (highlighted by a green box)?\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334629_386403736478083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from toy (highlighted by a red box)? Select from furniture (highlighted by a blue box) and toy (highlighted by a green box).\n(A) furniture\n(B) toy" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669854_12641451651500_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to swivel chair (highlighted by a red box)? Select from chair (highlighted by a blue box) and houseplant (highlighted by a green box).\n(A) chair\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332505_343938879779541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333277_24478504253416_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from window (highlighted by a red box)? Select from couch (highlighted by a blue box) and drawer (highlighted by a green box).\n(A) couch\n(B) drawer" }, { "from": "gpt", "value": "(B) drawer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662891_19503495497958_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, ball (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) ball\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333055_60385385251625_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is denim jacket (annotated by the red box) located relative to chair?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458607_125651598301458_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, toiletry (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) toiletry\n(B) toiletry" }, { "from": "gpt", "value": "(A) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896379_20376445429291_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from pillow (highlighted by a red box)? nightstand (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) nightstand\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445834_68137691477875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to floral arrangement (highlighted by a red box)? Choose from cabinetry (highlighted by a blue box) and appliance (highlighted by a green box).\n(A) cabinetry\n(B) appliance" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018846_649976406055541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from table (highlighted by a red box)? television (highlighted by a blue box) or lamp (highlighted by a green box)?\n(A) television\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896097_145235911108791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, studio couch (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444706_73228374203375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to window (highlighted by a red box)? cupboard (highlighted by a blue box) or sheet (highlighted by a green box).\n(A) cupboard\n(B) sheet" }, { "from": "gpt", "value": "(B) sheet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898983_823790305372833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445613_56556808446000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, home appliance (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) home appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(A) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896031_129181830532875_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from desk (highlighted by a red box), houseplant (highlighted by a blue box) or book (highlighted by a green box)?\n(A) houseplant\n(B) book" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649478_14949840144208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, book (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) book\n(B) pillow" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897870_529864755057291_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from gas stove (highlighted by a red box)? coffeepot (highlighted by a blue box) or bottle (highlighted by a green box)?\n(A) coffeepot\n(B) bottle" }, { "from": "gpt", "value": "(A) coffeepot" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332698_108440750735666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, door (highlighted by a red box) or hoodie (highlighted by a blue box)?\n(A) door\n(B) hoodie" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332207_264605778567040_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, magazine (highlighted by a red box) or table (highlighted by a blue box)?\n(A) magazine\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796722_27618991792083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to kitchen appliance (highlighted by a red box), cabinetry (highlighted by a blue box) or oven (highlighted by a green box)?\n(A) cabinetry\n(B) oven" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897955_216400827692958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the lamp (highlighted by a red box)? Choose among these: television (highlighted by a blue box) or table (highlighted by a green box).\n(A) television\n(B) table" }, { "from": "gpt", "value": "(A) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897434_104247325225541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from furniture (highlighted by a red box), chair (highlighted by a blue box) or electric outlet (highlighted by a green box)?\n(A) chair\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663009_32414515313625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the screen door (highlighted by a red box)? door (highlighted by a blue box) or chair (highlighted by a green box).\n(A) door\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358647_2977843977666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, oven (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) oven\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333946_45889299402583_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334892_623374658134541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from toilet paper (highlighted by a red box)? cupboard (highlighted by a blue box) or toilet paper (highlighted by a green box)?\n(A) cupboard\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334205_103777776869083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to table (highlighted by a red box)? shelf (highlighted by a blue box) or shelf (highlighted by a green box).\n(A) shelf\n(B) shelf" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47431120_348914035472958_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of light switch (annotated by the red box) in relation to light switch?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261344_24263344219708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from fireplace (highlighted by a red box)? studio couch (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429799_737755025827166_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to pillow (highlighted by a red box)? Select from cabinetry (highlighted by a blue box) and couch (highlighted by a green box).\n(A) cabinetry\n(B) couch" }, { "from": "gpt", "value": "(B) couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897422_104025234290541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, door (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) door\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662805_13529982764208_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from radiator (highlighted by a red box)? Choose among these: swivel chair (highlighted by a blue box) or door (highlighted by a green box).\n(A) swivel chair\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444750_79624374161375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, oven (highlighted by a red box) or window (highlighted by a blue box)?\n(A) oven\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895274_79151003486208_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to oven (highlighted by a red box), banana (highlighted by a blue box) or bar stool (highlighted by a green box)?\n(A) banana\n(B) bar stool" }, { "from": "gpt", "value": "(A) banana" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445132_5435832351875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to bed (highlighted by a red box)? Select from pillow (highlighted by a blue box) and lamp (highlighted by a green box).\n(A) pillow\n(B) lamp" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430935_95012134302291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, mouthwash (highlighted by a red box) or mouthwash (highlighted by a blue box)?\n(A) mouthwash\n(B) mouthwash" }, { "from": "gpt", "value": "(A) mouthwash" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896089_143924101317041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to houseplant (highlighted by a red box)? light fixture (highlighted by a blue box) or countertop (highlighted by a green box).\n(A) light fixture\n(B) countertop" }, { "from": "gpt", "value": "(B) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261153_605610507333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the screen door (highlighted by a red box)? magazine (highlighted by a blue box) or table (highlighted by a green box).\n(A) magazine\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898189_145110928812125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, medicine cabinet (highlighted by a red box) or brush (highlighted by a blue box)?\n(A) medicine cabinet\n(B) brush" }, { "from": "gpt", "value": "(A) medicine cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828442_91378130362666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, picture frame (highlighted by a red box) or droplight (highlighted by a blue box)?\n(A) picture frame\n(B) droplight" }, { "from": "gpt", "value": "(B) droplight" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332473_886618175436875_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from chair (highlighted by a red box)? clear (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) clear\n(B) chair" }, { "from": "gpt", "value": "(A) clear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331105_135627474857625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, toy (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331541_7005920551416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, table (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) table\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895508_452058923181666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the book (highlighted by a red box)? chest of drawers (highlighted by a blue box) or book (highlighted by a green box).\n(A) chest of drawers\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333319_28427144906541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from fruit (highlighted by a red box)? appliance (highlighted by a blue box) or bottle (highlighted by a green box)?\n(A) appliance\n(B) bottle" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430839_71046242660625_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458503_113299969917958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, studio couch (highlighted by a red box) or armchair (highlighted by a blue box)?\n(A) studio couch\n(B) armchair" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333033_58901237593791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from surfboard (highlighted by a red box)? Select from picture frame (highlighted by a blue box) and glass door (highlighted by a green box).\n(A) picture frame\n(B) glass door" }, { "from": "gpt", "value": "(B) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204529_2036939790375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to stool (highlighted by a red box)? Choose from curtain (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) curtain\n(B) picture frame" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332019_200766438620333_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895201_40079244845666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, oven (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) oven\n(B) appliance" }, { "from": "gpt", "value": "(A) oven" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333117_114376650124708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, window (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) window\n(B) curtain" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430212_688729344432875_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the vanity (highlighted by a red box)? bottle (highlighted by a blue box) or bottle (highlighted by a green box).\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333249_33581403620291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, furniture (highlighted by a red box) or wrapping paper (highlighted by a blue box)?\n(A) furniture\n(B) wrapping paper" }, { "from": "gpt", "value": "(B) wrapping paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430248_182327285203125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331103_135979681705250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, cupboard (highlighted by a red box) or door handle (highlighted by a blue box)?\n(A) cupboard\n(B) door handle" }, { "from": "gpt", "value": "(B) door handle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445168_7916526682250_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from curtain (highlighted by a red box)? Choose from exhaust hood (highlighted by a blue box) and window (highlighted by a green box).\n(A) exhaust hood\n(B) window" }, { "from": "gpt", "value": "(A) exhaust hood" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261507_43445526229041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, book (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) book\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018153_373389668213083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to bottle (highlighted by a red box)? shelf (highlighted by a blue box) or lamp (highlighted by a green box).\n(A) shelf\n(B) lamp" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331711_11255511644750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, radiator (highlighted by a red box) or cupboard (highlighted by a blue box)?\n(A) radiator\n(B) cupboard" }, { "from": "gpt", "value": "(B) cupboard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430236_181783973061416_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to blanket (highlighted by a red box)? dish washer (highlighted by a blue box) or washing machine (highlighted by a green box).\n(A) dish washer\n(B) washing machine" }, { "from": "gpt", "value": "(B) washing machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670048_33396911715374_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from bulletin board (highlighted by a red box)? Select from book (highlighted by a blue box) and cardboard box (highlighted by a green box).\n(A) book\n(B) cardboard box" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828476_100571058132083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, cabinetry (highlighted by a red box) or exhaust hood (highlighted by a blue box)?\n(A) cabinetry\n(B) exhaust hood" }, { "from": "gpt", "value": "(B) exhaust hood" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358693_3132723525375_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to television (highlighted by a red box)? mantle (highlighted by a blue box) or entertainment center (highlighted by a green box).\n(A) mantle\n(B) entertainment center" }, { "from": "gpt", "value": "(B) entertainment center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018751_7137251416625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, shelf (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) shelf\n(B) radiator" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796576_16724865728333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, screen door (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) screen door\n(B) radiator" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358340_15230421968416_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the book (highlighted by a red box)? curtain (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) curtain\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796709_27485078202666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, laundry (highlighted by a red box) or door (highlighted by a blue box)?\n(A) laundry\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898621_758038306364000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, toiletry (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) toiletry\n(B) toiletry" }, { "from": "gpt", "value": "(A) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204744_25370186313458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, pillow (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) pillow\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739342_46143324168625_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to dog (highlighted by a red box), box (highlighted by a blue box) or box (highlighted by a green box)?\n(A) box\n(B) box" }, { "from": "gpt", "value": "(B) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739595_199654675134500_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to chest of drawers (highlighted by a red box)? Select from pillow (highlighted by a blue box) and bed (highlighted by a green box).\n(A) pillow\n(B) bed" }, { "from": "gpt", "value": "(B) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358162_60950733720416_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from pillow (highlighted by a red box)? Select from studio couch (highlighted by a blue box) and mirror (highlighted by a green box).\n(A) studio couch\n(B) mirror" }, { "from": "gpt", "value": "(B) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796438_676619730375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, electric outlet (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) electric outlet\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458228_76783774254583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from glass door (highlighted by a red box)? loudspeaker (highlighted by a blue box) or mechanical fan (highlighted by a green box)?\n(A) loudspeaker\n(B) mechanical fan" }, { "from": "gpt", "value": "(B) mechanical fan" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828243_81860993428958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to bedside lamp (highlighted by a red box)? Choose from nightstand (highlighted by a blue box) and nightstand (highlighted by a green box).\n(A) nightstand\n(B) nightstand" }, { "from": "gpt", "value": "(A) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018844_649849307856916_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from dish washer (highlighted by a red box)? Choose among these: faucet (highlighted by a blue box) or electric outlet (highlighted by a green box).\n(A) faucet\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115358_4221801410958_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670184_51641741195375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, mirror (highlighted by a red box) or glass door (highlighted by a blue box)?\n(A) mirror\n(B) glass door" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796324_16015284954958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to robe (highlighted by a red box)? Choose from door (highlighted by a blue box) and robe (highlighted by a green box).\n(A) door\n(B) robe" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649732_49801195150375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, chest of drawers (highlighted by a red box) or dresser (highlighted by a blue box)?\n(A) chest of drawers\n(B) dresser" }, { "from": "gpt", "value": "(B) dresser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897653_147043776807000_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from microwave oven (highlighted by a red box)? power outlet (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) power outlet\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447294_408916309894583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is chair (annotated by the red box) located relative to chair?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899209_186771372633583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from mirror (highlighted by a red box)? Select from tree (highlighted by a blue box) and lamp (highlighted by a green box).\n(A) tree\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899486_955370509720958_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of waste container (annotated by the red box) in relation to cage? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895995_136182406505708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from lamp (highlighted by a red box)? Choose from table (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) table\n(B) picture frame" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896515_33508267862166_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from lamp (highlighted by a red box)? Select from window (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) window\n(B) picture frame" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261344_24287551304958_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, desk (highlighted by a red box) or laptop (highlighted by a blue box)?\n(A) desk\n(B) laptop" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333876_77208363252333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, spoon (highlighted by a red box) or square (highlighted by a blue box)?\n(A) spoon\n(B) square" }, { "from": "gpt", "value": "(A) spoon" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334158_348314826750875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, postcard (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) postcard\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899663_234447962079166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, screen door (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) screen door\n(B) curtain" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899567_958843120891458_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from window (highlighted by a red box)? picture frame (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334672_391406105509708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, cabinetry (highlighted by a red box) or counter (highlighted by a blue box)?\n(A) cabinetry\n(B) counter" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458329_102783622429125_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the appliance (highlighted by a red box)? cabinetry (highlighted by a blue box) or furniture (highlighted by a green box).\n(A) cabinetry\n(B) furniture" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828361_80283923027958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from plain (highlighted by a red box)? Choose from bath towel (highlighted by a blue box) and electric outlet (highlighted by a green box).\n(A) bath towel\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333265_21748118037375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, cabinetry (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) cabinetry\n(B) cabinetry" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261219_13503521964041_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from picture frame (highlighted by a red box)? picture frame (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) picture frame\n(B) pillow" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662829_15151592906958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, screen door (highlighted by a red box) or door (highlighted by a blue box)?\n(A) screen door\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895231_73987596119166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, cabinetry (highlighted by a red box) or sink (highlighted by a blue box)?\n(A) cabinetry\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331277_13188239871000_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from appliance (highlighted by a red box)? Choose from book (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) book\n(B) cabinetry" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899559_199454704664541_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to stairwell (highlighted by a red box)? door (highlighted by a blue box) or sink (highlighted by a green box).\n(A) door\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896096_144210799197583_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from picture frame (highlighted by a red box)? Choose among these: pillow (highlighted by a blue box) or bowl (highlighted by a green box).\n(A) pillow\n(B) bowl" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47431082_75470127852791_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899562_199530406652250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, bidet (highlighted by a red box) or tap (highlighted by a blue box)?\n(A) bidet\n(B) tap" }, { "from": "gpt", "value": "(A) bidet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796507_3189611380291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, toy (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828478_100716747833708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the chest of drawers (highlighted by a red box)? picture frame (highlighted by a blue box) or chair (highlighted by a green box).\n(A) picture frame\n(B) chair" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358661_1106996719375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, food (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) food\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204517_729169823666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, furniture (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) furniture\n(B) cabinetry" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204920_3742891622333_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chest of drawers (highlighted by a red box) or medicine cabinet (highlighted by a blue box)?\n(A) chest of drawers\n(B) medicine cabinet" }, { "from": "gpt", "value": "(B) medicine cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332812_48055932830375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, kitchen appliance (highlighted by a red box) or tap (highlighted by a blue box)?\n(A) kitchen appliance\n(B) tap" }, { "from": "gpt", "value": "(A) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358274_9076321459708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895263_78500474210500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, soap (highlighted by a red box) or home appliance (highlighted by a blue box)?\n(A) soap\n(B) home appliance" }, { "from": "gpt", "value": "(B) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333274_24074602493000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, toy (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899898_1027034441084416_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the armoire (highlighted by a red box)? furniture (highlighted by a blue box) or clothing (highlighted by a green box).\n(A) furniture\n(B) clothing" }, { "from": "gpt", "value": "(B) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899220_188284685829125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, glass bead (highlighted by a red box) or bay window (highlighted by a blue box)?\n(A) glass bead\n(B) bay window" }, { "from": "gpt", "value": "(A) glass bead" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429855_12702743888250_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to shower (highlighted by a red box)? Choose from shower (highlighted by a blue box) and air conditioner (highlighted by a green box).\n(A) shower\n(B) air conditioner" }, { "from": "gpt", "value": "(A) shower" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445211_10850317552166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897924_348995841252708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, toaster (highlighted by a red box) or counter top (highlighted by a blue box)?\n(A) toaster\n(B) counter top" }, { "from": "gpt", "value": "(A) toaster" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796517_3907400154375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, picture frame (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) picture frame\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333329_30087521709083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of cabinet (annotated by the red box) and cardboard box in the image provided, where is cabinet (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670201_53343414570125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from pillow (highlighted by a red box)? Choose from pillow (highlighted by a blue box) and studio couch (highlighted by a green box).\n(A) pillow\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115358_4257803083875_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from door (highlighted by a red box)? Select from door (highlighted by a blue box) and laundry basket (highlighted by a green box).\n(A) door\n(B) laundry basket" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333055_60397380374458_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the pillow (highlighted by a red box)? Choose among these: book (highlighted by a blue box) or table (highlighted by a green box).\n(A) book\n(B) table" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670023_32282597337708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, picture frame (highlighted by a red box) or wall clock (highlighted by a blue box)?\n(A) picture frame\n(B) wall clock" }, { "from": "gpt", "value": "(B) wall clock" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828320_76245738855833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, curtain (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) curtain\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333000_128269410128875_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to shelf (highlighted by a red box)? book (highlighted by a blue box) or television (highlighted by a green box).\n(A) book\n(B) television" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898242_695960803253583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, computer monitor (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) computer monitor\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458572_258175245583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from kitchen appliance (highlighted by a red box)? kitchen appliance (highlighted by a blue box) or gas stove (highlighted by a green box)?\n(A) kitchen appliance\n(B) gas stove" }, { "from": "gpt", "value": "(B) gas stove" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331625_20246343807500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, cabinetry (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) cabinetry\n(B) basket" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115255_99167486320666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from tap (highlighted by a red box)? sink (highlighted by a blue box) or counter top (highlighted by a green box)?\n(A) sink\n(B) counter top" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334912_1089918479390583_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from plant (highlighted by a red box)? Select from desk (highlighted by a blue box) and appliance (highlighted by a green box).\n(A) desk\n(B) appliance" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897720_114174629947750_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from studio couch (highlighted by a red box)? pillow (highlighted by a blue box) or billiard table (highlighted by a green box)?\n(A) pillow\n(B) billiard table" }, { "from": "gpt", "value": "(B) billiard table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333479_60149500780708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to glass jar (highlighted by a red box), bottle (highlighted by a blue box) or towel bar (highlighted by a green box)?\n(A) bottle\n(B) towel bar" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333111_108657686813708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from glass vase (highlighted by a red box)? window (highlighted by a blue box) or houseplant (highlighted by a green box)?\n(A) window\n(B) houseplant" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358274_9032322192666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to appliance (highlighted by a red box), cabinetry (highlighted by a blue box) or teal (highlighted by a green box)?\n(A) cabinetry\n(B) teal" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899209_186739369279666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chair (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) chair\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47330995_176935281162416_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the window (highlighted by a red box)? Choose among these: houseplant (highlighted by a blue box) or lamp (highlighted by a green box).\n(A) houseplant\n(B) lamp" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895793_680540600683541_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, book (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) book\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444860_96685354561625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, toy (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896487_23771015819541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from chair (highlighted by a red box)? Select from pillow (highlighted by a blue box) and radiator (highlighted by a green box).\n(A) pillow\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896126_147272520446291_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to shopping bag (highlighted by a red box)? Select from radiator (highlighted by a blue box) and desk (highlighted by a green box).\n(A) radiator\n(B) desk" }, { "from": "gpt", "value": "(B) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333277_24433805904541_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895593_1161546178019500_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from shelf (highlighted by a red box)? picture frame (highlighted by a blue box) or candle holder (highlighted by a green box)?\n(A) picture frame\n(B) candle holder" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898334_506648978517000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from pillow (highlighted by a red box)? pillow (highlighted by a blue box) or vase (highlighted by a green box)?\n(A) pillow\n(B) vase" }, { "from": "gpt", "value": "(B) vase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429739_20180066005833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, desk (highlighted by a red box) or basin (highlighted by a blue box)?\n(A) desk\n(B) basin" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204757_26700398353875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, bronze statue (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) bronze statue\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018276_794875077823875_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331174_276442795793041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, clothing (highlighted by a red box) or clothing (highlighted by a blue box)?\n(A) clothing\n(B) clothing" }, { "from": "gpt", "value": "(B) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445931_79335363900416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, pillow (highlighted by a red box) or window (highlighted by a blue box)?\n(A) pillow\n(B) window" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430599_315388312347166_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the picture frame (highlighted by a red box)? curtain (highlighted by a blue box) or book (highlighted by a green box).\n(A) curtain\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445758_65438942635166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is furniture (annotated by the red box) located relative to garbage?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895633_471717999747416_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from handbag (highlighted by a red box)? book (highlighted by a blue box) or book (highlighted by a green box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649603_36121608068291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, stool (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) stool\n(B) table lamp" }, { "from": "gpt", "value": "(A) stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828506_102394767650208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chair (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) chair\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331894_624538945760666_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to computer keyboard (highlighted by a red box)? Select from computer monitor (highlighted by a blue box) and computer monitor (highlighted by a green box).\n(A) computer monitor\n(B) computer monitor" }, { "from": "gpt", "value": "(A) computer monitor" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333033_58834831156791_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to window (highlighted by a red box)? screen door (highlighted by a blue box) or screen door (highlighted by a green box).\n(A) screen door\n(B) screen door" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331684_6493705961375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, door (highlighted by a red box) or window (highlighted by a blue box)?\n(A) door\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896187_141923114047541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to material (highlighted by a red box), picture frame (highlighted by a blue box) or oil painting (highlighted by a green box)?\n(A) picture frame\n(B) oil painting" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458337_102862722959416_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from shelf (highlighted by a red box)? Choose from glass door (highlighted by a blue box) and glass door (highlighted by a green box).\n(A) glass door\n(B) glass door" }, { "from": "gpt", "value": "(A) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895245_75732790501041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from computer monitor (highlighted by a red box)? Choose from dresser (highlighted by a blue box) and curtain (highlighted by a green box).\n(A) dresser\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444875_99399736467958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to window (highlighted by a red box), window sill (highlighted by a blue box) or bean bag chair (highlighted by a green box)?\n(A) window sill\n(B) bean bag chair" }, { "from": "gpt", "value": "(A) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332812_48049935277625_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896160_139887881541916_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to toilet paper (highlighted by a red box)? Choose from window (highlighted by a blue box) and light fixture (highlighted by a green box).\n(A) window\n(B) light fixture" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430901_80970657833750_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from window screen (highlighted by a red box), glass door (highlighted by a blue box) or lamp (highlighted by a green box)?\n(A) glass door\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446488_356797856265000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of cleaning product (annotated by the red box) and bottle in the image provided, where is cleaning product (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331710_11233320673916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, door (highlighted by a red box) or glass door (highlighted by a blue box)?\n(A) door\n(B) glass door" }, { "from": "gpt", "value": "(B) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358673_889099587583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, lamp (highlighted by a red box) or tap (highlighted by a blue box)?\n(A) lamp\n(B) tap" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896223_4960991456041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from plumbing fixture (highlighted by a red box)? Choose among these: tap (highlighted by a blue box) or curtain (highlighted by a green box).\n(A) tap\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898625_757750208366666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from cleaning product (highlighted by a red box)? toiletry (highlighted by a blue box) or screen door (highlighted by a green box)?\n(A) toiletry\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669881_11006908242625_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to cabinetry (highlighted by a red box)? Choose from chair (highlighted by a blue box) and chair (highlighted by a green box).\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739835_16848215679916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, toilet (highlighted by a red box) or soap dispenser (highlighted by a blue box)?\n(A) toilet\n(B) soap dispenser" }, { "from": "gpt", "value": "(B) soap dispenser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895572_1153800842024708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, houseplant (highlighted by a red box) or counter top (highlighted by a blue box)?\n(A) houseplant\n(B) counter top" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896043_130157052968916_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the sink (highlighted by a red box)? Choose among these: bidet (highlighted by a blue box) or toothpaste (highlighted by a green box).\n(A) bidet\n(B) toothpaste" }, { "from": "gpt", "value": "(A) bidet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669856_12414462353708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, chair (highlighted by a red box) or fireplace (highlighted by a blue box)?\n(A) chair\n(B) fireplace" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333281_25670535285166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, curtain (highlighted by a red box) or plain (highlighted by a blue box)?\n(A) curtain\n(B) plain" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828507_102549353504375_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from table (highlighted by a red box), chair (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) chair\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333890_78896360436291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to toy (highlighted by a red box)? picture frame (highlighted by a blue box) or chest of drawers (highlighted by a green box).\n(A) picture frame\n(B) chest of drawers" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358268_7141452751291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from kitchen & dining room table (highlighted by a red box)? curtain (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) curtain\n(B) chair" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898899_816948743794875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to countertop (highlighted by a red box), gas stove (highlighted by a blue box) or kitchen appliance (highlighted by a green box)?\n(A) gas stove\n(B) kitchen appliance" }, { "from": "gpt", "value": "(A) gas stove" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899333_715166055986750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of chair (annotated by the red box) in reference to studio couch?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115205_95153828093166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, door (highlighted by a red box) or door (highlighted by a blue box)?\n(A) door\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649634_39374246223208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, door handle (highlighted by a red box) or window (highlighted by a blue box)?\n(A) door handle\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261172_1432070965541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is book (annotated by the red box) located relative to book?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018613_633569612799166_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796596_18025677631083_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from sink (highlighted by a red box)? Choose among these: mirror (highlighted by a blue box) or book (highlighted by a green box).\n(A) mirror\n(B) book" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445938_79442570585500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, toy (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334655_389748637950750_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to sink (highlighted by a red box)? bathtub (highlighted by a blue box) or basket (highlighted by a green box).\n(A) bathtub\n(B) basket" }, { "from": "gpt", "value": "(B) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333035_58735238092500_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, curtain (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) curtain\n(B) radiator" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204481_24895478605291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to pillow (highlighted by a red box)? Choose from plate (highlighted by a blue box) and coffee table (highlighted by a green box).\n(A) plate\n(B) coffee table" }, { "from": "gpt", "value": "(B) coffee table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333810_51911662765625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to computer keyboard (highlighted by a red box)? Select from mousepad (highlighted by a blue box) and desk (highlighted by a green box).\n(A) mousepad\n(B) desk" }, { "from": "gpt", "value": "(A) mousepad" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115504_12318307060833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from toy (highlighted by a red box), book (highlighted by a blue box) or paperback book (highlighted by a green box)?\n(A) book\n(B) paperback book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895197_39249119287583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, desk (highlighted by a red box) or table (highlighted by a blue box)?\n(A) desk\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447294_408962907291750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of chair (annotated by the red box) and screen door in the image provided, where is chair (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332207_264519780163958_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, furniture (highlighted by a red box) or food (highlighted by a blue box)?\n(A) furniture\n(B) food" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895274_79104905484333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the desk (highlighted by a red box)? bottle (highlighted by a blue box) or notepad (highlighted by a green box).\n(A) bottle\n(B) notepad" }, { "from": "gpt", "value": "(B) notepad" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670174_42289403221708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the cabinetry (highlighted by a red box)? cardboard box (highlighted by a blue box) or light switch (highlighted by a green box).\n(A) cardboard box\n(B) light switch" }, { "from": "gpt", "value": "(B) light switch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662800_12908678652000_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018757_14862649126791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from cabinetry (highlighted by a red box)? Select from cabinetry (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) cabinetry\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445639_58348776471291_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the window sill (highlighted by a red box)? Choose among these: furniture (highlighted by a blue box) or curtain (highlighted by a green box).\n(A) furniture\n(B) curtain" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429841_11929259557458_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to microwave oven (highlighted by a red box)? cabinetry (highlighted by a blue box) or appliance (highlighted by a green box).\n(A) cabinetry\n(B) appliance" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333268_21976308522500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, dresser (highlighted by a red box) or platter (highlighted by a blue box)?\n(A) dresser\n(B) platter" }, { "from": "gpt", "value": "(A) dresser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261509_43562430003083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, bottle (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333610_76254934398125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to stool (highlighted by a red box)? tile (highlighted by a blue box) or chair (highlighted by a green box).\n(A) tile\n(B) chair" }, { "from": "gpt", "value": "(A) tile" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331498_153876310592666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, drawer (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) drawer\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358112_61711598729708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to flower (highlighted by a red box)? Choose from curtain (highlighted by a blue box) and table (highlighted by a green box).\n(A) curtain\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358645_3256228769708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, door (highlighted by a red box) or jug (highlighted by a blue box)?\n(A) door\n(B) jug" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331127_174315034824416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of book (annotated by the red box) in reference to book? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261087_394871184000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, furniture (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) furniture\n(B) shelf" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649787_45961014051750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, door (highlighted by a red box) or oven (highlighted by a blue box)?\n(A) door\n(B) oven" }, { "from": "gpt", "value": "(B) oven" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333776_48163434738250_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334733_535815432605291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, plant (highlighted by a red box) or paperback book (highlighted by a blue box)?\n(A) plant\n(B) paperback book" }, { "from": "gpt", "value": "(B) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331922_630799793218625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the plant (highlighted by a red box)? window (highlighted by a blue box) or shelf (highlighted by a green box).\n(A) window\n(B) shelf" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204274_12741257374083_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to chair (highlighted by a red box)? Choose from towel (highlighted by a blue box) and radiator (highlighted by a green box).\n(A) towel\n(B) radiator" }, { "from": "gpt", "value": "(A) towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358252_6079641943000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430271_185495906704083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, television (highlighted by a red box) or desk (highlighted by a blue box)?\n(A) television\n(B) desk" }, { "from": "gpt", "value": "(B) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445865_70754291463166_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the bottle (highlighted by a red box)? Choose among these: bottle (highlighted by a blue box) or bottle (highlighted by a green box).\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898621_757930600800958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, water cooler (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) water cooler\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796463_3627708736083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from cleaning product (highlighted by a red box)? Choose among these: mouthwash (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) mouthwash\n(B) picture frame" }, { "from": "gpt", "value": "(A) mouthwash" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429756_356881755529875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is trousers (annotated by the red box) located relative to radiator? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430739_336614741511333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, doormat (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) doormat\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898625_757772515868875_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from appliance (highlighted by a red box)? Select from cleaning product (highlighted by a blue box) and window sill (highlighted by a green box).\n(A) cleaning product\n(B) window sill" }, { "from": "gpt", "value": "(A) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898587_184461773955541_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of pillow (annotated by the red box) and chair in the image provided, where is pillow (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115394_3346863964583_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to cabinetry (highlighted by a red box)? Select from refrigerator (highlighted by a blue box) and countertop (highlighted by a green box).\n(A) refrigerator\n(B) countertop" }, { "from": "gpt", "value": "(A) refrigerator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898261_697082536097958_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from furniture (highlighted by a red box)? Choose among these: electric outlet (highlighted by a blue box) or electric outlet (highlighted by a green box).\n(A) electric outlet\n(B) electric outlet" }, { "from": "gpt", "value": "(A) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261533_74202236169583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, picture frame (highlighted by a red box) or glass door (highlighted by a blue box)?\n(A) picture frame\n(B) glass door" }, { "from": "gpt", "value": "(B) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332796_47425590529125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, book (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) book\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895571_1153740433020291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, refrigerator (highlighted by a red box) or footwear (highlighted by a blue box)?\n(A) refrigerator\n(B) footwear" }, { "from": "gpt", "value": "(A) refrigerator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899650_233698866951708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from window screen (highlighted by a red box)? Select from chair (highlighted by a blue box) and dinner party (highlighted by a green box).\n(A) chair\n(B) dinner party" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358281_9163520301333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, countertop (highlighted by a red box) or clock (highlighted by a blue box)?\n(A) countertop\n(B) clock" }, { "from": "gpt", "value": "(B) clock" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896487_23740511271875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is stool (annotated by the red box) located relative to door?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897436_104983535370791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, bed (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) bed\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670291_62292223896333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, table (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) table\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204363_15806827865708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, book (highlighted by a red box) or hole (highlighted by a blue box)?\n(A) book\n(B) hole" }, { "from": "gpt", "value": "(B) hole" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261499_42640074473041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to nightstand (highlighted by a red box), lamp (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) lamp\n(B) picture frame" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897815_132650484395832_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, bedding (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) bedding\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458582_1561271878708_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, shower curtain (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) shower curtain\n(B) screen door" }, { "from": "gpt", "value": "(A) shower curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898501_160037781021125_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445173_8105934591458_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to chair (highlighted by a red box)? Select from window screen (highlighted by a blue box) and window (highlighted by a green box).\n(A) window screen\n(B) window" }, { "from": "gpt", "value": "(A) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897462_470108054435208_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from straw hat (highlighted by a red box)? Choose among these: lamp (highlighted by a blue box) or studio couch (highlighted by a green box).\n(A) lamp\n(B) studio couch" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796505_3351913839375_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the pillow (highlighted by a red box)? Choose among these: pillow (highlighted by a blue box) or magazine (highlighted by a green box).\n(A) pillow\n(B) magazine" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358345_15190821036458_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from window (highlighted by a red box)? Choose among these: light fixture (highlighted by a blue box) or counter top (highlighted by a green box).\n(A) light fixture\n(B) counter top" }, { "from": "gpt", "value": "(A) light fixture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458548_127540135150791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, television (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) television\n(B) toy" }, { "from": "gpt", "value": "(A) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260957_5960292070916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, window (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) window\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331390_198814203662541_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of toilet (annotated by the red box) in relation to tile?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899109_128819469282791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is washing machine (annotated by the red box) located in relation to washing machine in the image? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895975_134621607116041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, shelf (highlighted by a red box) or clock (highlighted by a blue box)?\n(A) shelf\n(B) clock" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334493_63770950313583_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444719_75392176317791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, window (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) window\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333203_46896939759875_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332184_262653617937166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chest of drawers (highlighted by a red box) or postcard (highlighted by a blue box)?\n(A) chest of drawers\n(B) postcard" }, { "from": "gpt", "value": "(B) postcard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662890_19582695986375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is stationary bicycle (annotated by the red box) located relative to window screen?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331945_165234121568708_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, sink (highlighted by a red box) or mirror (highlighted by a blue box)?\n(A) sink\n(B) mirror" }, { "from": "gpt", "value": "(B) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445063_3561580800833_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430726_335719626088333_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333803_51574838038958_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898419_1207934150375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, flower (highlighted by a red box) or candle (highlighted by a blue box)?\n(A) flower\n(B) candle" }, { "from": "gpt", "value": "(B) candle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333014_130293100434333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, book (highlighted by a red box) or bookshelf (highlighted by a blue box)?\n(A) book\n(B) bookshelf" }, { "from": "gpt", "value": "(B) bookshelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331103_135810883746083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from basket (highlighted by a red box)? Choose from counter (highlighted by a blue box) and fruit (highlighted by a green box).\n(A) counter\n(B) fruit" }, { "from": "gpt", "value": "(B) fruit" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333497_62414902076291_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to studio couch (highlighted by a red box)? Choose from bean bag chair (highlighted by a blue box) and dresser (highlighted by a green box).\n(A) bean bag chair\n(B) dresser" }, { "from": "gpt", "value": "(A) bean bag chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899899_1026859429520250_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from curtain (highlighted by a red box)? bed (highlighted by a blue box) or bay window (highlighted by a green box)?\n(A) bed\n(B) bay window" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331891_623240644821958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, cabinetry (highlighted by a red box) or book (highlighted by a blue box)?\n(A) cabinetry\n(B) book" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895938_107679518515958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, chair (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) chair\n(B) bottle" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333674_134215760039124_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, adhesive tape (highlighted by a red box) or box (highlighted by a blue box)?\n(A) adhesive tape\n(B) box" }, { "from": "gpt", "value": "(B) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447294_408954710681375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, screen door (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) screen door\n(B) chair" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445168_7978535296250_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to curtain (highlighted by a red box), window sill (highlighted by a blue box) or window (highlighted by a green box)?\n(A) window sill\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430822_67699966977708_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, bottle (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444781_50264907955916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670150_40467631895583_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the candle holder (highlighted by a red box)? book (highlighted by a blue box) or chair (highlighted by a green box).\n(A) book\n(B) chair" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663317_76514774751375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from bath (highlighted by a red box)? Choose among these: bathroom cabinet (highlighted by a blue box) or faucet (highlighted by a green box).\n(A) bathroom cabinet\n(B) faucet" }, { "from": "gpt", "value": "(B) faucet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670100_41079114168208_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to candle holder (highlighted by a red box), candle holder (highlighted by a blue box) or clock (highlighted by a green box)?\n(A) candle holder\n(B) clock" }, { "from": "gpt", "value": "(A) candle holder" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018090_104115832718375_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to tap (highlighted by a red box), beach towel (highlighted by a blue box) or sink (highlighted by a green box)?\n(A) beach towel\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331512_155269919453541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to clothing (highlighted by a red box)? Select from balloon (highlighted by a blue box) and balloon (highlighted by a green box).\n(A) balloon\n(B) balloon" }, { "from": "gpt", "value": "(B) balloon" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444767_81442880033083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, bed (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) bed\n(B) curtain" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358460_46747969436250_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from shelf (highlighted by a red box)? Choose among these: toy (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) toy\n(B) picture frame" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895595_1161383177311666_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to chair (highlighted by a red box)? Choose from basket (highlighted by a blue box) and table (highlighted by a green box).\n(A) basket\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898332_506744889236916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, nightstand (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) nightstand\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445169_7827229032166_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from curtain (highlighted by a red box)? lamp (highlighted by a blue box) or studio couch (highlighted by a green box)?\n(A) lamp\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897655_147165777482333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from kitchen appliance (highlighted by a red box)? countertop (highlighted by a blue box) or kitchen appliance (highlighted by a green box)?\n(A) countertop\n(B) kitchen appliance" }, { "from": "gpt", "value": "(A) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899236_880505925540791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, toy (highlighted by a red box) or balloon (highlighted by a blue box)?\n(A) toy\n(B) balloon" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828369_92397014896750_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from electric outlet (highlighted by a red box)? Choose among these: desk (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) desk\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429816_744609900824375_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to table (highlighted by a red box)? Select from houseplant (highlighted by a blue box) and houseplant (highlighted by a green box).\n(A) houseplant\n(B) houseplant" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334912_1089936472157458_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to home appliance (highlighted by a red box)? cabinetry (highlighted by a blue box) or stool (highlighted by a green box).\n(A) cabinetry\n(B) stool" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358428_41414775988791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, towel (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) towel\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261677_3015537939666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from door (highlighted by a red box)? Select from table (highlighted by a blue box) and table (highlighted by a green box).\n(A) table\n(B) table" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649426_10785401775708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from electric outlet (highlighted by a red box)? gas stove (highlighted by a blue box) or kitchen appliance (highlighted by a green box)?\n(A) gas stove\n(B) kitchen appliance" }, { "from": "gpt", "value": "(B) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446462_354164328460916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, pillar (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) pillar\n(B) furniture" }, { "from": "gpt", "value": "(A) pillar" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897467_471617821333875_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the bath towel (highlighted by a red box)? plain (highlighted by a blue box) or dish washer (highlighted by a green box).\n(A) plain\n(B) dish washer" }, { "from": "gpt", "value": "(B) dish washer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429833_748587131049750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is toy (annotated by the red box) located in relation to cardboard box in the image? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430269_185673617809833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, television (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) television\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331159_181797012221958_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, countertop (highlighted by a red box) or hand towel (highlighted by a blue box)?\n(A) countertop\n(B) hand towel" }, { "from": "gpt", "value": "(A) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358345_15138825051083_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to cabinetry (highlighted by a red box)? Choose from curtain (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) curtain\n(B) cabinetry" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334805_429284297417541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, furniture (highlighted by a red box) or potty (highlighted by a blue box)?\n(A) furniture\n(B) potty" }, { "from": "gpt", "value": "(B) potty" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445872_71808085165083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of houseplant (annotated by the red box) in reference to window sill? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332591_362691387349083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, towel (highlighted by a red box) or shower door (highlighted by a blue box)?\n(A) towel\n(B) shower door" }, { "from": "gpt", "value": "(A) towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669854_12679452550458_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261153_557612970500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, mantle (highlighted by a red box) or fireplace (highlighted by a blue box)?\n(A) mantle\n(B) fireplace" }, { "from": "gpt", "value": "(B) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739919_16229162141333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, nightstand (highlighted by a red box) or chest of drawers (highlighted by a blue box)?\n(A) nightstand\n(B) chest of drawers" }, { "from": "gpt", "value": "(A) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333828_53384648784000_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115283_118246729513833_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from lamp (highlighted by a red box), window (highlighted by a blue box) or window screen (highlighted by a green box)?\n(A) window\n(B) window screen" }, { "from": "gpt", "value": "(B) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446561_86503469195416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to appliance (highlighted by a red box), cabinetry (highlighted by a blue box) or kitchen appliance (highlighted by a green box)?\n(A) cabinetry\n(B) kitchen appliance" }, { "from": "gpt", "value": "(B) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430862_74313894479250_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to book (highlighted by a red box)? Choose from bed (highlighted by a blue box) and nightstand (highlighted by a green box).\n(A) bed\n(B) nightstand" }, { "from": "gpt", "value": "(B) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458552_127491438704583_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739912_15666492099833_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from studio couch (highlighted by a red box), blanket (highlighted by a blue box) or bedding (highlighted by a green box)?\n(A) blanket\n(B) bedding" }, { "from": "gpt", "value": "(B) bedding" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897434_104175221949916_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from screen door (highlighted by a red box)? chest of drawers (highlighted by a blue box) or book (highlighted by a green box)?\n(A) chest of drawers\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261089_474155061500_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to basket (highlighted by a red box)? Choose from basket (highlighted by a blue box) and mixing bowl (highlighted by a green box).\n(A) basket\n(B) mixing bowl" }, { "from": "gpt", "value": "(A) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333275_24617497247666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, bottle (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) bottle\n(B) picture frame" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895797_680620401710625_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, picture frame (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) picture frame\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796326_16278076190625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, desk (highlighted by a red box) or coffee cup (highlighted by a blue box)?\n(A) desk\n(B) coffee cup" }, { "from": "gpt", "value": "(B) coffee cup" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260895_8752706323625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, bottle (highlighted by a red box) or beach towel (highlighted by a blue box)?\n(A) bottle\n(B) beach towel" }, { "from": "gpt", "value": "(B) beach towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261407_29657209679541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from lamp (highlighted by a red box)? Choose from door (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) door\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446485_355724347512625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from desk (highlighted by a red box), table (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261089_494163451416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, tableware (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) tableware\n(B) shelf" }, { "from": "gpt", "value": "(A) tableware" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649794_46012810223041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of pillow (annotated by the red box) in reference to pillow? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331498_153890304912750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, electric outlet (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) electric outlet\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332758_43233326543625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to door (highlighted by a red box)? square (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) square\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333040_59654756138625_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the gas stove (highlighted by a red box)? writing (highlighted by a blue box) or counter top (highlighted by a green box).\n(A) writing\n(B) counter top" }, { "from": "gpt", "value": "(B) counter top" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332022_202461106241458_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, pillow (highlighted by a red box) or couch (highlighted by a blue box)?\n(A) pillow\n(B) couch" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896247_7597088775333_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from window sill (highlighted by a red box)? Choose from curtain (highlighted by a blue box) and nightstand (highlighted by a green box).\n(A) curtain\n(B) nightstand" }, { "from": "gpt", "value": "(B) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796190_388330987416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, nightstand (highlighted by a red box) or alarm clock (highlighted by a blue box)?\n(A) nightstand\n(B) alarm clock" }, { "from": "gpt", "value": "(A) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430934_94917439437916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, waste (highlighted by a red box) or towel (highlighted by a blue box)?\n(A) waste\n(B) towel" }, { "from": "gpt", "value": "(A) waste" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204920_3764882914583_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the lamp (highlighted by a red box)? pillow (highlighted by a blue box) or nightstand (highlighted by a green box).\n(A) pillow\n(B) nightstand" }, { "from": "gpt", "value": "(B) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897870_529962964770791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, appliance (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) appliance\n(B) houseplant" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334890_623255956222125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, toiletry (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) toiletry\n(B) toiletry" }, { "from": "gpt", "value": "(B) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649597_35915710240625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chair (highlighted by a red box) or coffee cup (highlighted by a blue box)?\n(A) chair\n(B) coffee cup" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458729_138457729485166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of home appliance (annotated by the red box) in relation to cloth?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358105_61815489092125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to tablecloth (highlighted by a red box)? Choose from blanket (highlighted by a blue box) and window screen (highlighted by a green box).\n(A) blanket\n(B) window screen" }, { "from": "gpt", "value": "(A) blanket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334787_426436979816625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261709_1448627928583_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430568_309773789069333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to toilet paper (highlighted by a red box), toilet paper (highlighted by a blue box) or robe (highlighted by a green box)?\n(A) toilet paper\n(B) robe" }, { "from": "gpt", "value": "(A) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429682_10534825652166_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828439_90631950613833_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from curtain (highlighted by a red box)? window (highlighted by a blue box) or tea pot (highlighted by a green box)?\n(A) window\n(B) tea pot" }, { "from": "gpt", "value": "(B) tea pot" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895192_38435129553166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to cardboard box (highlighted by a red box), basket (highlighted by a blue box) or towel (highlighted by a green box)?\n(A) basket\n(B) towel" }, { "from": "gpt", "value": "(A) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334037_278451810996458_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897590_135016647534791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to cabinetry (highlighted by a red box)? Select from door (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) door\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662912_19975761104041_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to book (highlighted by a red box), bedside lamp (highlighted by a blue box) or nightstand (highlighted by a green box)?\n(A) bedside lamp\n(B) nightstand" }, { "from": "gpt", "value": "(A) bedside lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261533_74174231093166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, coffee table (highlighted by a red box) or table (highlighted by a blue box)?\n(A) coffee table\n(B) table" }, { "from": "gpt", "value": "(A) coffee table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739912_15704493743541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, window screen (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) window screen\n(B) toy" }, { "from": "gpt", "value": "(A) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430097_28808881439041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, storage box (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) storage box\n(B) shelf" }, { "from": "gpt", "value": "(A) storage box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458262_74149138685833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, computer keyboard (highlighted by a red box) or bookshelf (highlighted by a blue box)?\n(A) computer keyboard\n(B) bookshelf" }, { "from": "gpt", "value": "(B) bookshelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662835_15905646367208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, picture frame (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) picture frame\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898625_757746210008708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the mouthwash (highlighted by a red box)? screen door (highlighted by a blue box) or cleaning product (highlighted by a green box).\n(A) screen door\n(B) cleaning product" }, { "from": "gpt", "value": "(B) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649603_36045606335458_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, appliance (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896089_143876104510458_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to picture frame (highlighted by a red box), table (highlighted by a blue box) or swivel chair (highlighted by a green box)?\n(A) table\n(B) swivel chair" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358173_62411030996375_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331942_164669820807916_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to cardboard box (highlighted by a red box)? Choose from furniture (highlighted by a blue box) and handbag (highlighted by a green box).\n(A) furniture\n(B) handbag" }, { "from": "gpt", "value": "(B) handbag" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446493_356480652745291_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to appliance (highlighted by a red box)? Select from appliance (highlighted by a blue box) and toaster (highlighted by a green box).\n(A) appliance\n(B) toaster" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332598_362989822870333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from sink (highlighted by a red box)? Select from faucet (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) faucet\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649681_35595826122333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to mirror (highlighted by a red box)? soap dispenser (highlighted by a blue box) or sink (highlighted by a green box).\n(A) soap dispenser\n(B) sink" }, { "from": "gpt", "value": "(A) soap dispenser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828493_101922284814416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of screen door (annotated by the red box) and stool in the image provided, where is screen door (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358710_5077857905166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, door (highlighted by a red box) or balustrade (highlighted by a blue box)?\n(A) door\n(B) balustrade" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430962_99363269966791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, furniture (highlighted by a red box) or bed (highlighted by a blue box)?\n(A) furniture\n(B) bed" }, { "from": "gpt", "value": "(B) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204291_14512091560708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the home appliance (highlighted by a red box)? vanity (highlighted by a blue box) or appliance (highlighted by a green box).\n(A) vanity\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445594_285327533401833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, picture frame (highlighted by a red box) or concrete (highlighted by a blue box)?\n(A) picture frame\n(B) concrete" }, { "from": "gpt", "value": "(B) concrete" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334163_348181830264708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896009_137208262146916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, chair (highlighted by a red box) or book (highlighted by a blue box)?\n(A) chair\n(B) book" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897757_117851208256333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, studio couch (highlighted by a red box) or throw pillow (highlighted by a blue box)?\n(A) studio couch\n(B) throw pillow" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261541_74287734098750_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from studio couch (highlighted by a red box)? Choose from studio couch (highlighted by a blue box) and toy (highlighted by a green box).\n(A) studio couch\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895245_75752782303083_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204736_24083347289083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the door (highlighted by a red box)? blanket (highlighted by a blue box) or electric outlet (highlighted by a green box).\n(A) blanket\n(B) electric outlet" }, { "from": "gpt", "value": "(A) blanket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430982_101620730180041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the studio couch (highlighted by a red box)? Choose among these: bunk bed (highlighted by a blue box) or lamp (highlighted by a green box).\n(A) bunk bed\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897755_117576122334333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from pillow (highlighted by a red box)? Choose from table lamp (highlighted by a blue box) and chair (highlighted by a green box).\n(A) table lamp\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115379_1869384624166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, window (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) window\n(B) radiator" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204529_2044936480916_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the pillow (highlighted by a red box)? Choose among these: window (highlighted by a blue box) or screen door (highlighted by a green box).\n(A) window\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796721_27341884844916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, light switch (highlighted by a red box) or door (highlighted by a blue box)?\n(A) light switch\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333268_22058308385125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from tableware (highlighted by a red box)? glass jar (highlighted by a blue box) or mug (highlighted by a green box)?\n(A) glass jar\n(B) mug" }, { "from": "gpt", "value": "(A) glass jar" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649391_10995407066583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, picture frame (highlighted by a red box) or table (highlighted by a blue box)?\n(A) picture frame\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204670_12439133291791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458525_125958952742083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, studio couch (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334286_161215637991833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, furniture (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) furniture\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331512_155210810094125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, light switch (highlighted by a red box) or closet (highlighted by a blue box)?\n(A) light switch\n(B) closet" }, { "from": "gpt", "value": "(B) closet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897951_533585324529957_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, furniture (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) furniture\n(B) appliance" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204505_872760255416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, stool (highlighted by a red box) or stool (highlighted by a blue box)?\n(A) stool\n(B) stool" }, { "from": "gpt", "value": "(B) stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649440_12565540544333_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, mug (highlighted by a red box) or mug (highlighted by a blue box)?\n(A) mug\n(B) mug" }, { "from": "gpt", "value": "(B) mug" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333876_77226372606333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from cabinetry (highlighted by a red box)? dresser (highlighted by a blue box) or counter top (highlighted by a green box)?\n(A) dresser\n(B) counter top" }, { "from": "gpt", "value": "(A) dresser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331216_281073047695333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to door (highlighted by a red box)? Select from door (highlighted by a blue box) and doormat (highlighted by a green box).\n(A) door\n(B) doormat" }, { "from": "gpt", "value": "(B) doormat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796745_28665882271250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, picture frame (highlighted by a red box) or chest of drawers (highlighted by a blue box)?\n(A) picture frame\n(B) chest of drawers" }, { "from": "gpt", "value": "(B) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333292_26373535273625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, toilet paper (highlighted by a red box) or brush (highlighted by a blue box)?\n(A) toilet paper\n(B) brush" }, { "from": "gpt", "value": "(A) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663258_77840869012375_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to appliance (highlighted by a red box)? countertop (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) countertop\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115194_105612655990166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, cardboard box (highlighted by a red box) or storage box (highlighted by a blue box)?\n(A) cardboard box\n(B) storage box" }, { "from": "gpt", "value": "(A) cardboard box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260957_5952295235875_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from glass door (highlighted by a red box)? toiletry (highlighted by a blue box) or desk (highlighted by a green box)?\n(A) toiletry\n(B) desk" }, { "from": "gpt", "value": "(A) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796498_1576070552125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, lamp (highlighted by a red box) or table (highlighted by a blue box)?\n(A) lamp\n(B) table" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334737_536758532916458_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from material (highlighted by a red box)? Choose among these: beach towel (highlighted by a blue box) or beach towel (highlighted by a green box).\n(A) beach towel\n(B) beach towel" }, { "from": "gpt", "value": "(B) beach towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828230_69796631401583_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from studio couch (highlighted by a red box)? Choose among these: pillow (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) pillow\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115442_11680240901000_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from basket (highlighted by a red box), chest of drawers (highlighted by a blue box) or bedding (highlighted by a green box)?\n(A) chest of drawers\n(B) bedding" }, { "from": "gpt", "value": "(B) bedding" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358263_7285562374208_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from appliance (highlighted by a red box)? Choose among these: electric outlet (highlighted by a blue box) or electric outlet (highlighted by a green box).\n(A) electric outlet\n(B) electric outlet" }, { "from": "gpt", "value": "(A) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333513_48700087805458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, window (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) window\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429764_358143449692000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, houseplant (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) houseplant\n(B) window sill" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446488_356876157467625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from bucket (highlighted by a red box), desk (highlighted by a blue box) or toilet paper (highlighted by a green box)?\n(A) desk\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897655_147167776673291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, kitchen appliance (highlighted by a red box) or food (highlighted by a blue box)?\n(A) kitchen appliance\n(B) food" }, { "from": "gpt", "value": "(B) food" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670168_42208201986041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, cabinetry (highlighted by a red box) or vent (highlighted by a blue box)?\n(A) cabinetry\n(B) vent" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649478_14990840583416_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to furniture (highlighted by a red box)? radiator (highlighted by a blue box) or plaid (highlighted by a green box).\n(A) radiator\n(B) plaid" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115628_3421094320416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, appliance (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261153_557612970500_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, fireplace (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) fireplace\n(B) pillow" }, { "from": "gpt", "value": "(A) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739814_15595649815083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, cabinetry (highlighted by a red box) or door (highlighted by a blue box)?\n(A) cabinetry\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331899_624429339927333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, shelf (highlighted by a red box) or light fixture (highlighted by a blue box)?\n(A) shelf\n(B) light fixture" }, { "from": "gpt", "value": "(B) light fixture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899030_643070584318166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chair (highlighted by a red box) or desk (highlighted by a blue box)?\n(A) chair\n(B) desk" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649382_10560251820250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, picture frame (highlighted by a red box) or table (highlighted by a blue box)?\n(A) picture frame\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739275_42712874504208_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to cabinet (highlighted by a red box)? Choose from table lamp (highlighted by a blue box) and table (highlighted by a green box).\n(A) table lamp\n(B) table" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669880_11280299844500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the chair (highlighted by a red box)? Choose among these: wine bottle (highlighted by a blue box) or kitchen & dining room table (highlighted by a green box).\n(A) wine bottle\n(B) kitchen & dining room table" }, { "from": "gpt", "value": "(B) kitchen & dining room table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333785_48875966941625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, houseplant (highlighted by a red box) or flowerpot (highlighted by a blue box)?\n(A) houseplant\n(B) flowerpot" }, { "from": "gpt", "value": "(B) flowerpot" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358700_5226665571333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, picnic basket (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) picnic basket\n(B) toilet paper" }, { "from": "gpt", "value": "(A) picnic basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896524_34616722380916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from toy (highlighted by a red box)? paperback book (highlighted by a blue box) or toy (highlighted by a green box)?\n(A) paperback book\n(B) toy" }, { "from": "gpt", "value": "(A) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828245_81743392107875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, nightstand (highlighted by a red box) or bedside lamp (highlighted by a blue box)?\n(A) nightstand\n(B) bedside lamp" }, { "from": "gpt", "value": "(A) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331277_13234437547625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, pillow (highlighted by a red box) or paperback book (highlighted by a blue box)?\n(A) pillow\n(B) paperback book" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331525_191693687424333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, trousers (highlighted by a red box) or bathtub (highlighted by a blue box)?\n(A) trousers\n(B) bathtub" }, { "from": "gpt", "value": "(A) trousers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358386_19282745555000_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the rail (highlighted by a red box)? Choose among these: tree (highlighted by a blue box) or stairs (highlighted by a green box).\n(A) tree\n(B) stairs" }, { "from": "gpt", "value": "(A) tree" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458260_74293048474291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the cardboard box (highlighted by a red box)? Choose among these: box (highlighted by a blue box) or storage box (highlighted by a green box).\n(A) box\n(B) storage box" }, { "from": "gpt", "value": "(B) storage box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331520_190704271226333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, lamp (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) lamp\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115300_119452627371250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115174_104174749436208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, cabinetry (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) cabinetry\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898621_757944611692625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, bottle (highlighted by a red box) or waste container (highlighted by a blue box)?\n(A) bottle\n(B) waste container" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018760_15091456775083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chair (highlighted by a red box) or remote control (highlighted by a blue box)?\n(A) chair\n(B) remote control" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796709_27425085280125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, coffee machine (highlighted by a red box) or ceramic tile (highlighted by a blue box)?\n(A) coffee machine\n(B) ceramic tile" }, { "from": "gpt", "value": "(A) coffee machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333870_76206178838416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, furniture (highlighted by a red box) or cat bed (highlighted by a blue box)?\n(A) furniture\n(B) cat bed" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670001_29837676347583_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, home appliance (highlighted by a red box) or hardwood (highlighted by a blue box)?\n(A) home appliance\n(B) hardwood" }, { "from": "gpt", "value": "(B) hardwood" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204678_12482432834625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to picnic basket (highlighted by a red box)? Select from window (highlighted by a blue box) and chair (highlighted by a green box).\n(A) window\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332988_124406174045333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from toilet paper (highlighted by a red box)? Choose from counter top (highlighted by a blue box) and toiletry (highlighted by a green box).\n(A) counter top\n(B) toiletry" }, { "from": "gpt", "value": "(B) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899957_865530962393166_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from bed (highlighted by a red box)? Choose among these: dresser (highlighted by a blue box) or screen door (highlighted by a green box).\n(A) dresser\n(B) screen door" }, { "from": "gpt", "value": "(A) dresser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896096_144248800088583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, picture frame (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) picture frame\n(B) chair" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018063_718860822926875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, towel (highlighted by a red box) or clothing (highlighted by a blue box)?\n(A) towel\n(B) clothing" }, { "from": "gpt", "value": "(A) towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333665_131858408546375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739603_199547384229750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, window screen (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) window screen\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828449_91289232314333_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from pillow (highlighted by a red box)? window (highlighted by a blue box) or door (highlighted by a green box)?\n(A) window\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897955_216394430266791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, window blind (highlighted by a red box) or window blind (highlighted by a blue box)?\n(A) window blind\n(B) window blind" }, { "from": "gpt", "value": "(B) window blind" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895972_406459550360250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, toy (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) toy\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430209_688550949806875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, picture frame (highlighted by a red box) or ceramic tile (highlighted by a blue box)?\n(A) picture frame\n(B) ceramic tile" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018853_650489072131083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from toilet paper (highlighted by a red box)? Choose among these: sink (highlighted by a blue box) or bidet (highlighted by a green box).\n(A) sink\n(B) bidet" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332597_363026524693875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, pizza (highlighted by a red box) or counter top (highlighted by a blue box)?\n(A) pizza\n(B) counter top" }, { "from": "gpt", "value": "(A) pizza" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332207_264533774481958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to chair (highlighted by a red box)? chair (highlighted by a blue box) or swivel chair (highlighted by a green box).\n(A) chair\n(B) swivel chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458206_74611771420875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the clothing (highlighted by a red box)? picture frame (highlighted by a blue box) or glass door (highlighted by a green box).\n(A) picture frame\n(B) glass door" }, { "from": "gpt", "value": "(B) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896103_145392912543625_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331183_277502011495166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of houseplant (annotated by the red box) in reference to window?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897426_104124226508541_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from plain (highlighted by a red box)? table (highlighted by a blue box) or door (highlighted by a green box)?\n(A) table\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430795_60930069806541_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from picture frame (highlighted by a red box)? Select from door (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) door\n(B) picture frame" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898254_696650030986416_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018063_718862822113708_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, clothing (highlighted by a red box) or gear (highlighted by a blue box)?\n(A) clothing\n(B) gear" }, { "from": "gpt", "value": "(A) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358660_1021197354208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, bottle (highlighted by a red box) or window (highlighted by a blue box)?\n(A) bottle\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898256_696472037298833_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from book (highlighted by a red box)? book cover (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) book cover\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649633_39571247952416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of cabinetry (annotated by the red box) in reference to toilet?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429822_744712892050833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of window (annotated by the red box) in reference to door?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663064_38516488927166_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the table (highlighted by a red box)? Choose among these: chair (highlighted by a blue box) or curtain (highlighted by a green box).\n(A) chair\n(B) curtain" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331479_150943134942500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of door (annotated by the red box) in relation to postcard?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649409_10252693552833_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from pillow (highlighted by a red box)? Select from ladder (highlighted by a blue box) and chair (highlighted by a green box).\n(A) ladder\n(B) chair" }, { "from": "gpt", "value": "(A) ladder" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669959_27782095505583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, door (highlighted by a red box) or garbage (highlighted by a blue box)?\n(A) door\n(B) garbage" }, { "from": "gpt", "value": "(B) garbage" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331542_6884919377750_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, desk (highlighted by a red box) or television (highlighted by a blue box)?\n(A) desk\n(B) television" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446025_134695305336416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, baby carriage (highlighted by a red box) or cat (highlighted by a blue box)?\n(A) baby carriage\n(B) cat" }, { "from": "gpt", "value": "(A) baby carriage" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897462_470186055416125_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from picture frame (highlighted by a red box), lamp (highlighted by a blue box) or window (highlighted by a green box)?\n(A) lamp\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430414_127123500426541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, porcelain (highlighted by a red box) or bath towel (highlighted by a blue box)?\n(A) porcelain\n(B) bath towel" }, { "from": "gpt", "value": "(A) porcelain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430592_311059312169500_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from plastic bag (highlighted by a red box), plastic bag (highlighted by a blue box) or cardboard box (highlighted by a green box)?\n(A) plastic bag\n(B) cardboard box" }, { "from": "gpt", "value": "(A) plastic bag" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334194_355781022070333_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from bottle (highlighted by a red box)? Choose from faucet (highlighted by a blue box) and bottle (highlighted by a green box).\n(A) faucet\n(B) bottle" }, { "from": "gpt", "value": "(A) faucet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662908_20196852625958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to pillow (highlighted by a red box), radiator (highlighted by a blue box) or glass door (highlighted by a green box)?\n(A) radiator\n(B) glass door" }, { "from": "gpt", "value": "(B) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115260_115066274966541_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358117_62364082667791_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the oven (highlighted by a red box)? Choose among these: cabinetry (highlighted by a blue box) or kitchen appliance (highlighted by a green box).\n(A) cabinetry\n(B) kitchen appliance" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649451_12759247198125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, poster page (highlighted by a red box) or equipment (highlighted by a blue box)?\n(A) poster page\n(B) equipment" }, { "from": "gpt", "value": "(A) poster page" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649742_49600995183333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from studio couch (highlighted by a red box), table (highlighted by a blue box) or bar stool (highlighted by a green box)?\n(A) table\n(B) bar stool" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896404_16677218619914_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, washing machine (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) washing machine\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331606_18452007988791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of bathtub (annotated by the red box) in relation to doll?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333870_76219073606625_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458249_79368165627291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, toiletry (highlighted by a red box) or bath mat (highlighted by a blue box)?\n(A) toiletry\n(B) bath mat" }, { "from": "gpt", "value": "(B) bath mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739751_4172097571333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, door (highlighted by a red box) or bath towel (highlighted by a blue box)?\n(A) door\n(B) bath towel" }, { "from": "gpt", "value": "(B) bath towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115283_118298742290583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from basket (highlighted by a red box)? countertop (highlighted by a blue box) or cabinetry (highlighted by a green box)?\n(A) countertop\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670150_40497636701333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, picture frame (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) picture frame\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895938_107679518515958_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from desk (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and table lamp (highlighted by a green box).\n(A) picture frame\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796477_4130730011083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, light fixture (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) light fixture\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333310_28204635869833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, medicine cabinet (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) medicine cabinet\n(B) radiator" }, { "from": "gpt", "value": "(A) medicine cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796216_1982234240041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, picture frame (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) picture frame\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446466_355402462214458_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from cabinetry (highlighted by a red box)? Choose among these: chair (highlighted by a blue box) or screen door (highlighted by a green box).\n(A) chair\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333233_32323472367125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of studio couch (annotated by the red box) and table in the image provided, where is studio couch (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895956_133503162772415_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, blind (highlighted by a red box) or television (highlighted by a blue box)?\n(A) blind\n(B) television" }, { "from": "gpt", "value": "(B) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899950_864881628880458_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from garbage (highlighted by a red box)? stairwell (highlighted by a blue box) or furniture (highlighted by a green box)?\n(A) stairwell\n(B) furniture" }, { "from": "gpt", "value": "(A) stairwell" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739925_16354462559500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from window sill (highlighted by a red box)? window screen (highlighted by a blue box) or nightstand (highlighted by a green box)?\n(A) window screen\n(B) nightstand" }, { "from": "gpt", "value": "(B) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332397_401442501790541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, window (highlighted by a red box) or home appliance (highlighted by a blue box)?\n(A) window\n(B) home appliance" }, { "from": "gpt", "value": "(B) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115352_4065016561666_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, swivel chair (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) swivel chair\n(B) pillow" }, { "from": "gpt", "value": "(A) swivel chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899936_863448269695166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to cabinetry (highlighted by a red box), cabinetry (highlighted by a blue box) or bottle (highlighted by a green box)?\n(A) cabinetry\n(B) bottle" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899975_792662659291_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from picnic basket (highlighted by a red box)? studio couch (highlighted by a blue box) or window screen (highlighted by a green box)?\n(A) studio couch\n(B) window screen" }, { "from": "gpt", "value": "(B) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018760_15067349860958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from armchair (highlighted by a red box)? houseplant (highlighted by a blue box) or cabinetry (highlighted by a green box)?\n(A) houseplant\n(B) cabinetry" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458562_128128223319916_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from electric outlet (highlighted by a red box)? footwear (highlighted by a blue box) or waste container (highlighted by a green box)?\n(A) footwear\n(B) waste container" }, { "from": "gpt", "value": "(B) waste container" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331276_12791751847583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, shelf (highlighted by a red box) or box (highlighted by a blue box)?\n(A) shelf\n(B) box" }, { "from": "gpt", "value": "(B) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333239_32202971020041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from glass jar (highlighted by a red box)? Choose from door (highlighted by a blue box) and toy (highlighted by a green box).\n(A) door\n(B) toy" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899232_880555638558125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, glass vase (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) glass vase\n(B) lamp" }, { "from": "gpt", "value": "(A) glass vase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261332_24031133026416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, bathtub (highlighted by a red box) or concrete (highlighted by a blue box)?\n(A) bathtub\n(B) concrete" }, { "from": "gpt", "value": "(A) bathtub" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897478_112745148233291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, bed (highlighted by a red box) or towel (highlighted by a blue box)?\n(A) bed\n(B) towel" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430262_185387417335708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from glass plate (highlighted by a red box), bookcase (highlighted by a blue box) or cabinetry (highlighted by a green box)?\n(A) bookcase\n(B) cabinetry" }, { "from": "gpt", "value": "(A) bookcase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204329_14349614128791_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from coffee cup (highlighted by a red box)? Choose among these: closet (highlighted by a blue box) or mirror (highlighted by a green box).\n(A) closet\n(B) mirror" }, { "from": "gpt", "value": "(A) closet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739846_17116427359458_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the window sill (highlighted by a red box)? Choose among these: window (highlighted by a blue box) or door (highlighted by a green box).\n(A) window\n(B) door" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333293_26506630548333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, toilet paper (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) toilet paper\n(B) toilet paper" }, { "from": "gpt", "value": "(A) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261675_3127441572958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, cabinetry (highlighted by a red box) or chest of drawers (highlighted by a blue box)?\n(A) cabinetry\n(B) chest of drawers" }, { "from": "gpt", "value": "(B) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333288_25287824915291_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to nightstand (highlighted by a red box)? bed (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) bed\n(B) picture frame" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204363_15862922341083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from cardboard box (highlighted by a red box)? Select from cardboard box (highlighted by a blue box) and chair (highlighted by a green box).\n(A) cardboard box\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898254_696684033679708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the cabinetry (highlighted by a red box)? paperback book (highlighted by a blue box) or book (highlighted by a green box).\n(A) paperback book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895469_132819922456083_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828369_92383020685166_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to chair (highlighted by a red box), chair (highlighted by a blue box) or armchair (highlighted by a green box)?\n(A) chair\n(B) armchair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447294_408922307414166_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899600_202660422646333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, screen door (highlighted by a red box) or glass vase (highlighted by a blue box)?\n(A) screen door\n(B) glass vase" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670323_65684774851790_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chair (highlighted by a red box) or animal (highlighted by a blue box)?\n(A) chair\n(B) animal" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331127_174284747072291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, radiator (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) radiator\n(B) pillow" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333233_32339465924041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, table (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) table\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115624_3605088221000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chair (highlighted by a red box) or table (highlighted by a blue box)?\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895201_40081244034125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, desk (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) desk\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445692_63112678082541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of chest of drawers (annotated by the red box) and radiator in the image provided, where is chest of drawers (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333325_29549032972458_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, desk (highlighted by a red box) or vase (highlighted by a blue box)?\n(A) desk\n(B) vase" }, { "from": "gpt", "value": "(B) vase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332705_109838912975958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from clothing (highlighted by a red box)? door (highlighted by a blue box) or light switch (highlighted by a green box)?\n(A) door\n(B) light switch" }, { "from": "gpt", "value": "(B) light switch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115205_95213836200083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, chair (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) chair\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333778_48353541011583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, cardboard box (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) cardboard box\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334040_278871007511291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from table (highlighted by a red box)? Select from mat (highlighted by a blue box) and chair (highlighted by a green box).\n(A) mat\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333873_76259373924791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from television (highlighted by a red box), bottle (highlighted by a blue box) or remote (highlighted by a green box)?\n(A) bottle\n(B) remote" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334624_385768521852833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, table (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) table\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261158_664903648333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to window screen (highlighted by a red box), studio couch (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445599_285053829664833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the curtain (highlighted by a red box)? Choose among these: window sill (highlighted by a blue box) or curtain (highlighted by a green box).\n(A) window sill\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429822_744668593480583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to bed (highlighted by a red box)? Select from pillow (highlighted by a blue box) and chair (highlighted by a green box).\n(A) pillow\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332152_259937932233166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is screen door (annotated by the red box) located relative to furniture? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430822_67719175879125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, table (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) table\n(B) toy" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446466_355478447908541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from swivel chair (highlighted by a red box)? Select from chair (highlighted by a blue box) and mat (highlighted by a green box).\n(A) chair\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649798_46118518389208_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to studio couch (highlighted by a red box)? Choose from mat (highlighted by a blue box) and table (highlighted by a green box).\n(A) mat\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332396_401352804906833_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from shelf (highlighted by a red box)? Select from pillow (highlighted by a blue box) and book (highlighted by a green box).\n(A) pillow\n(B) book" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446450_354619026041666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of furniture (annotated by the red box) in relation to furniture? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670184_51658234337625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, lamp (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) lamp\n(B) toiletry" }, { "from": "gpt", "value": "(B) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896224_4912694907291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, radiator (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) radiator\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899333_715092953017791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to microwave oven (highlighted by a red box)? sink (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) sink\n(B) cabinetry" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828328_77650578472833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the chair (highlighted by a red box)? blanket (highlighted by a blue box) or door (highlighted by a green box).\n(A) blanket\n(B) door" }, { "from": "gpt", "value": "(A) blanket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897560_473437296138000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, furniture (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) furniture\n(B) radiator" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331479_150923143013541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, home appliance (highlighted by a red box) or food (highlighted by a blue box)?\n(A) home appliance\n(B) food" }, { "from": "gpt", "value": "(A) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260892_8799203662916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, candle (highlighted by a red box) or bath mat (highlighted by a blue box)?\n(A) candle\n(B) bath mat" }, { "from": "gpt", "value": "(A) candle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334032_273499208307333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, cabinetry (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) cabinetry\n(B) lamp" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115205_95189829636625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to table (highlighted by a red box)? Select from chair (highlighted by a blue box) and chair (highlighted by a green box).\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898903_817222031972250_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to counter (highlighted by a red box)? Select from furniture (highlighted by a blue box) and table (highlighted by a green box).\n(A) furniture\n(B) table" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662805_13545992772791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to table (highlighted by a red box), radiator (highlighted by a blue box) or door (highlighted by a green box)?\n(A) radiator\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670158_40778142339708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, kitchen appliance (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) kitchen appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332503_344012983053708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, studio couch (highlighted by a red box) or table (highlighted by a blue box)?\n(A) studio couch\n(B) table" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331277_13067955818708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to home appliance (highlighted by a red box)? Choose from video camera (highlighted by a blue box) and home appliance (highlighted by a green box).\n(A) video camera\n(B) home appliance" }, { "from": "gpt", "value": "(A) video camera" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445799_67025112969541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, screen door (highlighted by a red box) or concrete (highlighted by a blue box)?\n(A) screen door\n(B) concrete" }, { "from": "gpt", "value": "(B) concrete" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898221_164153438909833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to shoe (highlighted by a red box)? food (highlighted by a blue box) or shoe (highlighted by a green box).\n(A) food\n(B) shoe" }, { "from": "gpt", "value": "(B) shoe" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895972_406429062902083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is chair (annotated by the red box) located in relation to chair in the image? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204877_3569030107083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, door (highlighted by a red box) or bath towel (highlighted by a blue box)?\n(A) door\n(B) bath towel" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334876_621679921671291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from string (highlighted by a red box)? paperback book (highlighted by a blue box) or clock (highlighted by a green box)?\n(A) paperback book\n(B) clock" }, { "from": "gpt", "value": "(B) clock" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261499_42644072892000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of picture frame (annotated by the red box) and window in the image provided, where is picture frame (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896522_34694323573540_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, glass jar (highlighted by a red box) or book (highlighted by a blue box)?\n(A) glass jar\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895574_1153837244019750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, counter top (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) counter top\n(B) basket" }, { "from": "gpt", "value": "(B) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445128_5116232753333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, entertainment center (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) entertainment center\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896310_6761731835666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to table (highlighted by a red box), picnic basket (highlighted by a blue box) or shelf (highlighted by a green box)?\n(A) picnic basket\n(B) shelf" }, { "from": "gpt", "value": "(A) picnic basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444768_81498773876500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from shoulder bag (highlighted by a red box)? door (highlighted by a blue box) or door (highlighted by a green box)?\n(A) door\n(B) door" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358230_10116569957875_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from pillow (highlighted by a red box)? Choose among these: bed (highlighted by a blue box) or nightstand (highlighted by a green box).\n(A) bed\n(B) nightstand" }, { "from": "gpt", "value": "(B) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897482_112622746664250_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899282_885215964979750_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to blender (highlighted by a red box)? Choose from slow cooker (highlighted by a blue box) and produce (highlighted by a green box).\n(A) slow cooker\n(B) produce" }, { "from": "gpt", "value": "(A) slow cooker" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334226_107186012096291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, shelf (highlighted by a red box) or drawer (highlighted by a blue box)?\n(A) shelf\n(B) drawer" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897653_147013672301166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, chair (highlighted by a red box) or table (highlighted by a blue box)?\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662833_15807153820750_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from picture frame (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and flower (highlighted by a green box).\n(A) picture frame\n(B) flower" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662890_19574699305250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, door (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) door\n(B) radiator" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458690_135442795085875_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to television (highlighted by a red box)? Select from footrest (highlighted by a blue box) and desk (highlighted by a green box).\n(A) footrest\n(B) desk" }, { "from": "gpt", "value": "(B) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115650_4723446505791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to table (highlighted by a red box), pillow (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) pillow\n(B) picture frame" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332290_385267592146291_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334621_385421929758541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chair (highlighted by a red box) or table (highlighted by a blue box)?\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332320_390835671332500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, shelf (highlighted by a red box) or magazine (highlighted by a blue box)?\n(A) shelf\n(B) magazine" }, { "from": "gpt", "value": "(B) magazine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458706_136836471911375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from sink (highlighted by a red box)? Select from counter (highlighted by a blue box) and appliance (highlighted by a green box).\n(A) counter\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739574_198474248827541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, picture frame (highlighted by a red box) or window (highlighted by a blue box)?\n(A) picture frame\n(B) window" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897509_472336406465750_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from dumbbell (highlighted by a red box)? Select from dumbbell (highlighted by a blue box) and barbell (highlighted by a green box).\n(A) dumbbell\n(B) barbell" }, { "from": "gpt", "value": "(B) barbell" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115235_95835239251416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of table (annotated by the red box) in relation to cardboard box? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828476_100597047380208_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the swivel chair (highlighted by a red box)? Choose among these: appliance (highlighted by a blue box) or bottle (highlighted by a green box).\n(A) appliance\n(B) bottle" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261455_35799455506375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, pillow (highlighted by a red box) or flat (highlighted by a blue box)?\n(A) pillow\n(B) flat" }, { "from": "gpt", "value": "(B) flat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663250_74996280675291_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the lamp (highlighted by a red box)? lamp (highlighted by a blue box) or television (highlighted by a green box).\n(A) lamp\n(B) television" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899650_233731070871750_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896096_144240786749583_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the table (highlighted by a red box)? Choose among these: chair (highlighted by a blue box) or plywood (highlighted by a green box).\n(A) chair\n(B) plywood" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649393_11267694139833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, paperback book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) paperback book\n(B) book" }, { "from": "gpt", "value": "(A) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897480_470959427790708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, curtain (highlighted by a red box) or box (highlighted by a blue box)?\n(A) curtain\n(B) box" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899284_885324353325958_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670168_42198205936791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, lemon (highlighted by a red box) or pad (highlighted by a blue box)?\n(A) lemon\n(B) pad" }, { "from": "gpt", "value": "(B) pad" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895577_1155258153289166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, towel bar (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) towel bar\n(B) toiletry" }, { "from": "gpt", "value": "(B) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895469_132740021905666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, table (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) table\n(B) picture frame" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429841_11913266038041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to microwave oven (highlighted by a red box)? Select from toy (highlighted by a blue box) and document (highlighted by a green box).\n(A) toy\n(B) document" }, { "from": "gpt", "value": "(B) document" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446061_80607075007041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is medicine cabinet (annotated by the red box) located relative to home appliance? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332591_362651186948875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, screen door (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) screen door\n(B) screen door" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261378_26930011146541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, window frame (highlighted by a red box) or stationary bicycle (highlighted by a blue box)?\n(A) window frame\n(B) stationary bicycle" }, { "from": "gpt", "value": "(B) stationary bicycle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828368_92185519080833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, cabinetry (highlighted by a red box) or glass door (highlighted by a blue box)?\n(A) cabinetry\n(B) glass door" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331800_227934374993333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the basket (highlighted by a red box)? bottle (highlighted by a blue box) or countertop (highlighted by a green box).\n(A) bottle\n(B) countertop" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430221_180215397573333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from computer tower (highlighted by a red box)? radiator (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) radiator\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897547_473244092588833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chest of drawers (highlighted by a red box) or cat bed (highlighted by a blue box)?\n(A) chest of drawers\n(B) cat bed" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895818_685982233351708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to medicine cabinet (highlighted by a red box), mirror (highlighted by a blue box) or bottle (highlighted by a green box)?\n(A) mirror\n(B) bottle" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115338_2249263374958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from book (highlighted by a red box)? Select from book (highlighted by a blue box) and shelf (highlighted by a green box).\n(A) book\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429799_737958726849083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to fireplace (highlighted by a red box)? curtain (highlighted by a blue box) or armchair (highlighted by a green box).\n(A) curtain\n(B) armchair" }, { "from": "gpt", "value": "(B) armchair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204474_25089568265750_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to picture frame (highlighted by a red box)? Select from picture frame (highlighted by a blue box) and toy (highlighted by a green box).\n(A) picture frame\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332109_683200213093666_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, sheet (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) sheet\n(B) radiator" }, { "from": "gpt", "value": "(A) sheet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828231_70018226976916_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from plain (highlighted by a red box)? Choose among these: studio couch (highlighted by a blue box) or blanket (highlighted by a green box).\n(A) studio couch\n(B) blanket" }, { "from": "gpt", "value": "(B) blanket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332389_398733115098750_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to stationery (highlighted by a red box)? Choose from bag (highlighted by a blue box) and desk (highlighted by a green box).\n(A) bag\n(B) desk" }, { "from": "gpt", "value": "(B) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204274_12749254061708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from door (highlighted by a red box)? glass door (highlighted by a blue box) or cleaning product (highlighted by a green box)?\n(A) glass door\n(B) cleaning product" }, { "from": "gpt", "value": "(A) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739930_16745209767833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, toilet paper (highlighted by a red box) or towel bar (highlighted by a blue box)?\n(A) toilet paper\n(B) towel bar" }, { "from": "gpt", "value": "(A) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204589_553213747166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, sink (highlighted by a red box) or door (highlighted by a blue box)?\n(A) sink\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895507_452130527537708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, footwear (highlighted by a red box) or footwear (highlighted by a blue box)?\n(A) footwear\n(B) footwear" }, { "from": "gpt", "value": "(A) footwear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895272_79348106806250_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to tableware (highlighted by a red box)? Select from sink (highlighted by a blue box) and tap (highlighted by a green box).\n(A) sink\n(B) tap" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899955_865610862726333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, dresser (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) dresser\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332204_264172870823041_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears farthest from the camera in this image?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332769_43692021027958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of furniture (annotated by the red box) and window sill in the image provided, where is furniture (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898571_183831092366291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the mirror (highlighted by a red box)? Choose among these: pillow (highlighted by a blue box) or chair (highlighted by a green box).\n(A) pillow\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670218_53987961228333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from picture frame (highlighted by a red box)? candle (highlighted by a blue box) or furniture (highlighted by a green box)?\n(A) candle\n(B) furniture" }, { "from": "gpt", "value": "(A) candle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333298_26630429451500_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from toiletry (highlighted by a red box)? Choose among these: bath towel (highlighted by a blue box) or brush (highlighted by a green box).\n(A) bath towel\n(B) brush" }, { "from": "gpt", "value": "(B) brush" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445057_3397280303541_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from window (highlighted by a red box)? radiator (highlighted by a blue box) or curtain (highlighted by a green box)?\n(A) radiator\n(B) curtain" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649451_12771242452958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to picture frame (highlighted by a red box), picture frame (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333018_130157205398500_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from poster (highlighted by a red box), poster (highlighted by a blue box) or poster (highlighted by a green box)?\n(A) poster\n(B) poster" }, { "from": "gpt", "value": "(A) poster" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649393_11241704939125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of furniture (annotated by the red box) in relation to plywood?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260877_7391163168875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, studio couch (highlighted by a red box) or bowl (highlighted by a blue box)?\n(A) studio couch\n(B) bowl" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444916_220539169589541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, window (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) window\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445691_57465381076375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from grocery bag (highlighted by a red box), backpack (highlighted by a blue box) or clothing (highlighted by a green box)?\n(A) backpack\n(B) clothing" }, { "from": "gpt", "value": "(B) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446579_205799452807041_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from houseplant (highlighted by a red box)? Choose among these: book (highlighted by a blue box) or vegetation (highlighted by a green box).\n(A) book\n(B) vegetation" }, { "from": "gpt", "value": "(B) vegetation" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332197_263686738730666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to bath mat (highlighted by a red box), bath (highlighted by a blue box) or toilet paper (highlighted by a green box)?\n(A) bath\n(B) toilet paper" }, { "from": "gpt", "value": "(A) bath" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48017956_455619500374875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of furniture (annotated by the red box) and furniture in the image provided, where is furniture (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649586_35289126383750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, appliance (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445689_61711872730125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739261_40040475861958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663377_92406406563375_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from glass window (highlighted by a red box)? Choose from flower (highlighted by a blue box) and glass vase (highlighted by a green box).\n(A) flower\n(B) glass vase" }, { "from": "gpt", "value": "(B) glass vase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204856_1719334803166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from screen door (highlighted by a red box)? Choose from screen door (highlighted by a blue box) and door (highlighted by a green box).\n(A) screen door\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739969_18610374168583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, shelf (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) shelf\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331910_627547884560041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chair (highlighted by a red box) or laptop (highlighted by a blue box)?\n(A) chair\n(B) laptop" }, { "from": "gpt", "value": "(B) laptop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204481_24828571763291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, curtain (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) curtain\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261100_1153144547041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, microwave oven (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) microwave oven\n(B) appliance" }, { "from": "gpt", "value": "(A) microwave oven" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430217_180279205127958_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to water (highlighted by a red box)? mat (highlighted by a blue box) or wide (highlighted by a green box).\n(A) mat\n(B) wide" }, { "from": "gpt", "value": "(B) wide" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895272_79404300622333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, cabinetry (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) cabinetry\n(B) cabinetry" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018616_633622408061916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, beach towel (highlighted by a red box) or tile (highlighted by a blue box)?\n(A) beach towel\n(B) tile" }, { "from": "gpt", "value": "(A) beach towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444524_4211638160750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, dish washer (highlighted by a red box) or door (highlighted by a blue box)?\n(A) dish washer\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333056_60179585430416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of lamp (annotated by the red box) in reference to appliance?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445639_58362770676041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from bath towel (highlighted by a red box), bath towel (highlighted by a blue box) or bunk bed (highlighted by a green box)?\n(A) bath towel\n(B) bunk bed" }, { "from": "gpt", "value": "(B) bunk bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331508_155193916947125_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the material (highlighted by a red box)? cabinetry (highlighted by a blue box) or door (highlighted by a green box).\n(A) cabinetry\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649408_10112399050375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to picture frame (highlighted by a red box)? Choose from door (highlighted by a blue box) and door (highlighted by a green box).\n(A) door\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333310_28222645198250_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from flower (highlighted by a red box), chair (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899268_883866200897666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, balustrade (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) balustrade\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896089_143952089735833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, coffee machine (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) coffee machine\n(B) cabinetry" }, { "from": "gpt", "value": "(A) coffee machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334938_663139295615500_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of toiletry (annotated by the red box) in reference to toiletry?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895637_471671701906041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from dresser (highlighted by a red box)? Choose among these: houseplant (highlighted by a blue box) or table lamp (highlighted by a green box).\n(A) houseplant\n(B) table lamp" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204449_23036979001583_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to lamp (highlighted by a red box)? Choose from pillow (highlighted by a blue box) and lamp (highlighted by a green box).\n(A) pillow\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333603_75440383867166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, furniture (highlighted by a red box) or television (highlighted by a blue box)?\n(A) furniture\n(B) television" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331053_482516014646916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to shelf (highlighted by a red box)? Select from picture frame (highlighted by a blue box) and electric outlet (highlighted by a green box).\n(A) picture frame\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261695_525755706708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the cabinetry (highlighted by a red box)? Choose among these: sink (highlighted by a blue box) or countertop (highlighted by a green box).\n(A) sink\n(B) countertop" }, { "from": "gpt", "value": "(B) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796279_854667243500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, shower (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) shower\n(B) screen door" }, { "from": "gpt", "value": "(A) shower" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895595_1161391174083791_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from bar stool (highlighted by a red box)? Choose among these: countertop (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) countertop\n(B) cabinetry" }, { "from": "gpt", "value": "(A) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018119_368563033917583_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, houseplant (highlighted by a red box) or window (highlighted by a blue box)?\n(A) houseplant\n(B) window" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204330_14253718740666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, picture frame (highlighted by a red box) or bed (highlighted by a blue box)?\n(A) picture frame\n(B) bed" }, { "from": "gpt", "value": "(B) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018549_830139024566666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from houseplant (highlighted by a red box)? Choose among these: radiator (highlighted by a blue box) or window sill (highlighted by a green box).\n(A) radiator\n(B) window sill" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899470_954197030281833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, electric outlet (highlighted by a red box) or door (highlighted by a blue box)?\n(A) electric outlet\n(B) door" }, { "from": "gpt", "value": "(A) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898917_816685234657916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to curtain (highlighted by a red box)? Select from door (highlighted by a blue box) and postcard (highlighted by a green box).\n(A) door\n(B) postcard" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358362_16351364807458_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, studio couch (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898006_219503938135416_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115424_4900909648541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, toilet (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) toilet\n(B) toiletry" }, { "from": "gpt", "value": "(A) toilet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333973_47890982108666_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, table (highlighted by a red box) or log (highlighted by a blue box)?\n(A) table\n(B) log" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333119_114291351477958_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, air conditioning (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) air conditioning\n(B) cabinetry" }, { "from": "gpt", "value": "(A) air conditioning" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333960_46906139767208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, picture frame (highlighted by a red box) or bath mat (highlighted by a blue box)?\n(A) picture frame\n(B) bath mat" }, { "from": "gpt", "value": "(B) bath mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897783_129440229664375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of bathtub (annotated by the red box) in reference to soap dispenser?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334914_1090101672291666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, countertop (highlighted by a red box) or counter (highlighted by a blue box)?\n(A) countertop\n(B) counter" }, { "from": "gpt", "value": "(B) counter" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333308_28041352249250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of chair (annotated by the red box) and tableware in the image provided, where is chair (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358386_19302754301958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from chair (highlighted by a red box)? lamp (highlighted by a blue box) or television (highlighted by a green box)?\n(A) lamp\n(B) television" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331217_281124343564500_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to houseplant (highlighted by a red box)? Choose from houseplant (highlighted by a blue box) and window (highlighted by a green box).\n(A) houseplant\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018584_5606591998583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897757_117797214017333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to table (highlighted by a red box)? Choose from table lamp (highlighted by a blue box) and mat (highlighted by a green box).\n(A) table lamp\n(B) mat" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739455_51648395296708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, curtain (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) curtain\n(B) screen door" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331936_164610328171333_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, curtain (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) curtain\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332599_362928114476416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is book (annotated by the red box) located in relation to basket in the image? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204739_24121748050000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, door (highlighted by a red box) or potty (highlighted by a blue box)?\n(A) door\n(B) potty" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332609_363509422900958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chair (highlighted by a red box) or candle holder (highlighted by a blue box)?\n(A) chair\n(B) candle holder" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898541_180962760945708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from door (highlighted by a red box)? cabinetry (highlighted by a blue box) or counter top (highlighted by a green box)?\n(A) cabinetry\n(B) counter top" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333618_76287437925833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the cabinetry (highlighted by a red box)? Choose among these: bottle (highlighted by a blue box) or silver (highlighted by a green box).\n(A) bottle\n(B) silver" }, { "from": "gpt", "value": "(B) silver" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445627_58202070573083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, curtain (highlighted by a red box) or window (highlighted by a blue box)?\n(A) curtain\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895446_129392881518250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, cleaning product (highlighted by a red box) or counter (highlighted by a blue box)?\n(A) cleaning product\n(B) counter" }, { "from": "gpt", "value": "(A) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358386_19232748692791_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from armchair (highlighted by a red box)? Select from pillow (highlighted by a blue box) and coffee table (highlighted by a green box).\n(A) pillow\n(B) coffee table" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333882_77118466376916_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331522_190754284311208_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from oven (highlighted by a red box)? Choose among these: bottle (highlighted by a blue box) or dish washer (highlighted by a green box).\n(A) bottle\n(B) dish washer" }, { "from": "gpt", "value": "(B) dish washer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204493_26423326987416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, porcelain (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) porcelain\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458503_113289973870250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444712_73960205889125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, bed (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) bed\n(B) pillow" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895263_78420190138458_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the towel/napkin (highlighted by a red box)? bathrobe (highlighted by a blue box) or drawer (highlighted by a green box).\n(A) bathrobe\n(B) drawer" }, { "from": "gpt", "value": "(B) drawer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896304_6870138921708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, kitchen appliance (highlighted by a red box) or silverware (highlighted by a blue box)?\n(A) kitchen appliance\n(B) silverware" }, { "from": "gpt", "value": "(A) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115238_97794878029166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, suitcase (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) suitcase\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333574_207547835667208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, shelf (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) shelf\n(B) picture frame" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663313_76554275070500_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from toiletry (highlighted by a red box), bottle (highlighted by a blue box) or cabinetry (highlighted by a green box)?\n(A) bottle\n(B) cabinetry" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649654_40655895273083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from pillow (highlighted by a red box)? Select from book (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) book\n(B) pillow" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897434_104165226110166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, studio couch (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) studio couch\n(B) table lamp" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334787_426458970917750_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895250_75596296321708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, desk (highlighted by a red box) or mouse (highlighted by a blue box)?\n(A) desk\n(B) mouse" }, { "from": "gpt", "value": "(B) mouse" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334754_421189702644333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from radiator (highlighted by a red box)? Choose among these: window screen (highlighted by a blue box) or armchair (highlighted by a green box).\n(A) window screen\n(B) armchair" }, { "from": "gpt", "value": "(B) armchair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444511_3395841668000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, mouthwash (highlighted by a red box) or tap (highlighted by a blue box)?\n(A) mouthwash\n(B) tap" }, { "from": "gpt", "value": "(A) mouthwash" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332810_48238824669083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445804_67806408152541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, air conditioning (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) air conditioning\n(B) radiator" }, { "from": "gpt", "value": "(A) air conditioning" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445047_1899734637583_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895837_1222462105865625_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115394_3374869555708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to home appliance (highlighted by a red box)? Choose from appliance (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261406_29806800511208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, bulletin board (highlighted by a red box) or art (highlighted by a blue box)?\n(A) bulletin board\n(B) art" }, { "from": "gpt", "value": "(B) art" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358472_46644377090916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018098_367330615542166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, hanger (highlighted by a red box) or fancy dress (highlighted by a blue box)?\n(A) hanger\n(B) fancy dress" }, { "from": "gpt", "value": "(B) fancy dress" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899944_864848026148166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chest of drawers (highlighted by a red box) or vanity (highlighted by a blue box)?\n(A) chest of drawers\n(B) vanity" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430716_335297812269625_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from mat (highlighted by a red box)? Choose from table (highlighted by a blue box) and stool (highlighted by a green box).\n(A) table\n(B) stool" }, { "from": "gpt", "value": "(B) stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897898_345304800500291_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from computer monitor (highlighted by a red box)? table (highlighted by a blue box) or desk (highlighted by a green box)?\n(A) table\n(B) desk" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204493_26366416212833_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from bathtub (highlighted by a red box)? Choose among these: shower door (highlighted by a blue box) or toilet paper (highlighted by a green box).\n(A) shower door\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649382_10600251912750_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the picture frame (highlighted by a red box)? mirror (highlighted by a blue box) or table lamp (highlighted by a green box).\n(A) mirror\n(B) table lamp" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895995_136134409726040_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from box (highlighted by a red box)? Choose from coffee cup (highlighted by a blue box) and bottle (highlighted by a green box).\n(A) coffee cup\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898007_219405144588458_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444908_106390666825291_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204305_15314267774625_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669911_12702898790125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, bath (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) bath\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331220_282481911891666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, screen door (highlighted by a red box) or light switch (highlighted by a blue box)?\n(A) screen door\n(B) light switch" }, { "from": "gpt", "value": "(B) light switch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898256_696504040872833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, picture frame (highlighted by a red box) or bookcase (highlighted by a blue box)?\n(A) picture frame\n(B) bookcase" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333152_40332317989791_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018846_649903719033708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of refrigerator (annotated by the red box) and paper in the image provided, where is refrigerator (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333275_24682503885083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to houseplant (highlighted by a red box)? Select from cabinetry (highlighted by a blue box) and houseplant (highlighted by a green box).\n(A) cabinetry\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204519_1686070671083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, furniture (highlighted by a red box) or cage (highlighted by a blue box)?\n(A) furniture\n(B) cage" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333203_46890942191083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, bird cage (highlighted by a red box) or table (highlighted by a blue box)?\n(A) bird cage\n(B) table" }, { "from": "gpt", "value": "(A) bird cage" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663065_38343990484625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to home appliance (highlighted by a red box)? Choose from kitchen appliance (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) kitchen appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(A) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897948_351387915547833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, desk (highlighted by a red box) or rail (highlighted by a blue box)?\n(A) desk\n(B) rail" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115127_84750936633666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to chair (highlighted by a red box)? chair (highlighted by a blue box) or appliance (highlighted by a green box).\n(A) chair\n(B) appliance" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895191_38643728328750_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from bidet (highlighted by a red box)? Choose from material (highlighted by a blue box) and cleaning product (highlighted by a green box).\n(A) material\n(B) cleaning product" }, { "from": "gpt", "value": "(B) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445692_63082573997291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, plain (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) plain\n(B) pillow" }, { "from": "gpt", "value": "(A) plain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334890_623263952987708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, cleaning product (highlighted by a red box) or bath towel (highlighted by a blue box)?\n(A) cleaning product\n(B) bath towel" }, { "from": "gpt", "value": "(B) bath towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332592_362589778451041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from bottle (highlighted by a red box), bottle (highlighted by a blue box) or cabinetry (highlighted by a green box)?\n(A) bottle\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897512_472712501484375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, shelf (highlighted by a red box) or box (highlighted by a blue box)?\n(A) shelf\n(B) box" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261206_11656466902041_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649686_36168961328208_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from toilet bowl (highlighted by a red box), curtain (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) curtain\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115235_95859245943875_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to curtain (highlighted by a red box)? picture frame (highlighted by a blue box) or shelf (highlighted by a green box).\n(A) picture frame\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446462_354254425023916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, chair (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) chair\n(B) bottle" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332305_387209825192416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, door (highlighted by a red box) or window (highlighted by a blue box)?\n(A) door\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895956_133469160181541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, chair (highlighted by a red box) or stool (highlighted by a blue box)?\n(A) chair\n(B) stool" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115177_104347247893541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, picture frame (highlighted by a red box) or air conditioner (highlighted by a blue box)?\n(A) picture frame\n(B) air conditioner" }, { "from": "gpt", "value": "(B) air conditioner" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458552_127491438704583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of pillow (annotated by the red box) and pillow in the image provided, where is pillow (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458597_125187351661625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, toilet (highlighted by a red box) or blanket (highlighted by a blue box)?\n(A) toilet\n(B) blanket" }, { "from": "gpt", "value": "(A) toilet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670179_43155768462875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, shower (highlighted by a red box) or air conditioner (highlighted by a blue box)?\n(A) shower\n(B) air conditioner" }, { "from": "gpt", "value": "(A) shower" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358710_5073859497500_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the window (highlighted by a red box)? houseplant (highlighted by a blue box) or houseplant (highlighted by a green box).\n(A) houseplant\n(B) houseplant" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895272_79356103556916_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to kitchen appliance (highlighted by a red box)? Choose from appliance (highlighted by a blue box) and kitchen appliance (highlighted by a green box).\n(A) appliance\n(B) kitchen appliance" }, { "from": "gpt", "value": "(B) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204451_22977185983375_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to glass door (highlighted by a red box), table (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358362_16158158183208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, curtain (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) curtain\n(B) lamp" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447294_408958908945625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of chair (annotated by the red box) in reference to chair?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334020_271665997234416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, bottle (highlighted by a red box) or kitchen appliance (highlighted by a blue box)?\n(A) bottle\n(B) kitchen appliance" }, { "from": "gpt", "value": "(B) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331589_15935285362125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, picture frame (highlighted by a red box) or window (highlighted by a blue box)?\n(A) picture frame\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333310_28196639126833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, picture frame (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) picture frame\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204852_1517535063333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from soap dispenser (highlighted by a red box)? Choose from plumbing fixture (highlighted by a blue box) and soap dispenser (highlighted by a green box).\n(A) plumbing fixture\n(B) soap dispenser" }, { "from": "gpt", "value": "(A) plumbing fixture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662995_30717594122166_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to toiletry (highlighted by a red box), bidet (highlighted by a blue box) or sink (highlighted by a green box)?\n(A) bidet\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429766_358344251309208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, light fixture (highlighted by a red box) or beach towel (highlighted by a blue box)?\n(A) light fixture\n(B) beach towel" }, { "from": "gpt", "value": "(B) beach towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444787_50401101990291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from furniture (highlighted by a red box)? Choose from furniture (highlighted by a blue box) and window (highlighted by a green box).\n(A) furniture\n(B) window" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897728_114274438476791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from curtain (highlighted by a red box)? Choose among these: basket (highlighted by a blue box) or glass door (highlighted by a green box).\n(A) basket\n(B) glass door" }, { "from": "gpt", "value": "(A) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899898_1027116740579083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to furniture (highlighted by a red box)? Choose from lamp (highlighted by a blue box) and tableware (highlighted by a green box).\n(A) lamp\n(B) tableware" }, { "from": "gpt", "value": "(B) tableware" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895908_110710939970208_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from door (highlighted by a red box)? Choose from window (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) window\n(B) pillow" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333040_59718763520000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, counter (highlighted by a red box) or bowl (highlighted by a blue box)?\n(A) counter\n(B) bowl" }, { "from": "gpt", "value": "(B) bowl" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358170_62336543841666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chair (highlighted by a red box) or table (highlighted by a blue box)?\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445684_61935662707750_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, glass door (highlighted by a red box) or door (highlighted by a blue box)?\n(A) glass door\n(B) door" }, { "from": "gpt", "value": "(A) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897480_470971422846833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, window screen (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) window screen\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358111_61665900963083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from tableware (highlighted by a red box), chair (highlighted by a blue box) or mirror (highlighted by a green box)?\n(A) chair\n(B) mirror" }, { "from": "gpt", "value": "(B) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896169_140661521291833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to studio couch (highlighted by a red box), picture frame (highlighted by a blue box) or fireplace (highlighted by a green box)?\n(A) picture frame\n(B) fireplace" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898651_572747826157625_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896083_144015896657208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chair (highlighted by a red box) or table (highlighted by a blue box)?\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895987_136450111740958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from magazine (highlighted by a red box)? picture frame (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796475_4266923555624_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, chest of drawers (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) chest of drawers\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430298_187476753920625_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the nightstand (highlighted by a red box)? chest of drawers (highlighted by a blue box) or table lamp (highlighted by a green box).\n(A) chest of drawers\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429736_19985662001666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from toy (highlighted by a red box)? Select from shelf (highlighted by a blue box) and toy (highlighted by a green box).\n(A) shelf\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445613_56556808446000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, home appliance (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) home appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334213_105718191039375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from chair (highlighted by a red box)? Choose from shelf (highlighted by a blue box) and shelf (highlighted by a green box).\n(A) shelf\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331281_14160598370041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the toilet paper (highlighted by a red box)? Choose among these: bath towel (highlighted by a blue box) or toilet paper (highlighted by a green box).\n(A) bath towel\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333472_58500637005291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, shelf (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) shelf\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445584_283422764969291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, extension cord (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) extension cord\n(B) toilet paper" }, { "from": "gpt", "value": "(A) extension cord" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663415_95828666291708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the pillow (highlighted by a red box)? television (highlighted by a blue box) or table lamp (highlighted by a green box).\n(A) television\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444923_220881345501000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from light switch (highlighted by a red box)? Choose among these: window (highlighted by a blue box) or curtain (highlighted by a green box).\n(A) window\n(B) curtain" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334189_354711364799583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, counter top (highlighted by a red box) or magazine (highlighted by a blue box)?\n(A) counter top\n(B) magazine" }, { "from": "gpt", "value": "(B) magazine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334193_355733424655458_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from toilet paper (highlighted by a red box)? appliance (highlighted by a blue box) or power plugs and sockets (highlighted by a green box)?\n(A) appliance\n(B) power plugs and sockets" }, { "from": "gpt", "value": "(B) power plugs and sockets" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333319_28465146001416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, plant (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) plant\n(B) houseplant" }, { "from": "gpt", "value": "(A) plant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899034_643257122546125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334284_161085340874375_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to control (highlighted by a red box), control (highlighted by a blue box) or desk (highlighted by a green box)?\n(A) control\n(B) desk" }, { "from": "gpt", "value": "(A) control" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334074_88966780529833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, book (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) book\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898215_145784668380250_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the chair (highlighted by a red box)? Choose among these: floral arrangement (highlighted by a blue box) or lighting (highlighted by a green box).\n(A) floral arrangement\n(B) lighting" }, { "from": "gpt", "value": "(B) lighting" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430455_1820741486583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to table lamp (highlighted by a red box)? Select from furniture (highlighted by a blue box) and computer monitor (highlighted by a green box).\n(A) furniture\n(B) computer monitor" }, { "from": "gpt", "value": "(B) computer monitor" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444574_31907797252000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, screen door (highlighted by a red box) or fireplace (highlighted by a blue box)?\n(A) screen door\n(B) fireplace" }, { "from": "gpt", "value": "(B) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334025_271606787696833_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to bottle (highlighted by a red box)? Select from cabinetry (highlighted by a blue box) and bottle (highlighted by a green box).\n(A) cabinetry\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115448_11714943203333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to bulletin board (highlighted by a red box)? window screen (highlighted by a blue box) or mirror (highlighted by a green box).\n(A) window screen\n(B) mirror" }, { "from": "gpt", "value": "(A) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895975_134609612081166_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261452_35741946056625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, picture frame (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) picture frame\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796446_613712478458_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the bedside lamp (highlighted by a red box)? Choose among these: bed (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) bed\n(B) pillow" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895868_107564776217125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, picture frame (highlighted by a red box) or plant (highlighted by a blue box)?\n(A) picture frame\n(B) plant" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739563_198388149527875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, appliance (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) appliance\n(B) chair" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649589_35337423053125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, gas stove (highlighted by a red box) or oven (highlighted by a blue box)?\n(A) gas stove\n(B) oven" }, { "from": "gpt", "value": "(B) oven" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332592_362600890624500_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the toilet paper (highlighted by a red box)? bath towel (highlighted by a blue box) or shower door (highlighted by a green box).\n(A) bath towel\n(B) shower door" }, { "from": "gpt", "value": "(B) shower door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899573_959550532447625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, appliance (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358173_62521037468625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, furniture (highlighted by a red box) or tile (highlighted by a blue box)?\n(A) furniture\n(B) tile" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333862_75558751335875_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from toiletry (highlighted by a red box)? toiletry (highlighted by a blue box) or mirror (highlighted by a green box)?\n(A) toiletry\n(B) mirror" }, { "from": "gpt", "value": "(B) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115650_4735441753291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the picture frame (highlighted by a red box)? Choose among these: window sill (highlighted by a blue box) or chair (highlighted by a green box).\n(A) window sill\n(B) chair" }, { "from": "gpt", "value": "(A) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018273_794986082606041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, door (highlighted by a red box) or cardboard box (highlighted by a blue box)?\n(A) door\n(B) cardboard box" }, { "from": "gpt", "value": "(B) cardboard box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204449_23042976629250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, furniture (highlighted by a red box) or fireplace (highlighted by a blue box)?\n(A) furniture\n(B) fireplace" }, { "from": "gpt", "value": "(B) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895272_79342109243333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the bottle (highlighted by a red box)? Choose among these: cutting board (highlighted by a blue box) or tap (highlighted by a green box).\n(A) cutting board\n(B) tap" }, { "from": "gpt", "value": "(A) cutting board" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796438_664624705833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, window (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) window\n(B) chair" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429835_748693937936250_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from box (highlighted by a red box)? Choose among these: box (highlighted by a blue box) or bag (highlighted by a green box).\n(A) box\n(B) bag" }, { "from": "gpt", "value": "(B) bag" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47431088_75896062773333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, poster (highlighted by a red box) or plywood (highlighted by a blue box)?\n(A) poster\n(B) plywood" }, { "from": "gpt", "value": "(B) plywood" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333994_50494771470458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, food (highlighted by a red box) or food (highlighted by a blue box)?\n(A) food\n(B) food" }, { "from": "gpt", "value": "(B) food" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899630_229923271545416_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332490_341189081671208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, tap (highlighted by a red box) or tap (highlighted by a blue box)?\n(A) tap\n(B) tap" }, { "from": "gpt", "value": "(B) tap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895956_133475157699125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, bottle (highlighted by a red box) or kitchen appliance (highlighted by a blue box)?\n(A) bottle\n(B) kitchen appliance" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204341_14962194669666_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is picture frame (annotated by the red box) located in relation to picture frame in the image? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358700_5186664741083_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from shelf (highlighted by a red box)? Choose from basket (highlighted by a blue box) and counter (highlighted by a green box).\n(A) basket\n(B) counter" }, { "from": "gpt", "value": "(A) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333274_24116602119875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, studio couch (highlighted by a red box) or bath towel (highlighted by a blue box)?\n(A) studio couch\n(B) bath towel" }, { "from": "gpt", "value": "(B) bath towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895298_90972837947833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, studio couch (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898716_582164145065375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from bed (highlighted by a red box)? table lamp (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) table lamp\n(B) pillow" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334614_385150252406666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the shelf (highlighted by a red box)? Choose among these: cardboard box (highlighted by a blue box) or lamp (highlighted by a green box).\n(A) cardboard box\n(B) lamp" }, { "from": "gpt", "value": "(A) cardboard box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334608_384985852347083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, guitar (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) guitar\n(B) curtain" }, { "from": "gpt", "value": "(A) guitar" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204670_12431136453416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, door (highlighted by a red box) or couch (highlighted by a blue box)?\n(A) door\n(B) couch" }, { "from": "gpt", "value": "(B) couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333670_133974158220416_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from picnic basket (highlighted by a red box)? Choose from storage box (highlighted by a blue box) and book (highlighted by a green box).\n(A) storage box\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895920_112136000333375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, yoga mat (highlighted by a red box) or box (highlighted by a blue box)?\n(A) yoga mat\n(B) box" }, { "from": "gpt", "value": "(B) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430860_74440594690166_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the doormat (highlighted by a red box)? laundry (highlighted by a blue box) or door (highlighted by a green box).\n(A) laundry\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261292_16324741602791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from bed (highlighted by a red box)? Select from pillow (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) pillow\n(B) cabinetry" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261087_400868704333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, toy (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) toy\n(B) basket" }, { "from": "gpt", "value": "(B) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896304_6854145256291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895871_489440485169416_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from tile (highlighted by a red box)? cabinetry (highlighted by a blue box) or kitchen appliance (highlighted by a green box)?\n(A) cabinetry\n(B) kitchen appliance" }, { "from": "gpt", "value": "(B) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670008_30401590812083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, table (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) table\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115240_97890871606458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of table (annotated by the red box) and studio couch in the image provided, where is table (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444695_72592572305375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, dresser (highlighted by a red box) or kitchen appliance (highlighted by a blue box)?\n(A) dresser\n(B) kitchen appliance" }, { "from": "gpt", "value": "(A) dresser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334079_88650775433958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from window blind (highlighted by a red box)? Choose from plant (highlighted by a blue box) and counter (highlighted by a green box).\n(A) plant\n(B) counter" }, { "from": "gpt", "value": "(B) counter" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895911_111458840832875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, sink (highlighted by a red box) or stairwell (highlighted by a blue box)?\n(A) sink\n(B) stairwell" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445955_130023548479041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to picture frame (highlighted by a red box)? pillow (highlighted by a blue box) or book (highlighted by a green box).\n(A) pillow\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670346_66286495600833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to cabinetry (highlighted by a red box), door (highlighted by a blue box) or drawer (highlighted by a green box)?\n(A) door\n(B) drawer" }, { "from": "gpt", "value": "(B) drawer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430442_724451862333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from tablecloth (highlighted by a red box)? table (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899489_197728540129750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, plant (highlighted by a red box) or kitchen & dining room table (highlighted by a blue box)?\n(A) plant\n(B) kitchen & dining room table" }, { "from": "gpt", "value": "(B) kitchen & dining room table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898006_219503938135416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhere is window (annotated by the red box) located in relation to electric outlet in the image?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429728_19226435666166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, chest of drawers (highlighted by a red box) or bed (highlighted by a blue box)?\n(A) chest of drawers\n(B) bed" }, { "from": "gpt", "value": "(B) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331343_192421407890708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, computer monitor (highlighted by a red box) or book (highlighted by a blue box)?\n(A) computer monitor\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260957_5974303194625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to concrete (highlighted by a red box), door (highlighted by a blue box) or shower curtain (highlighted by a green box)?\n(A) door\n(B) shower curtain" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670100_41151117527833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of bedding (annotated by the red box) in reference to pillow? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444708_73339462238625_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662996_30848389857583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from clothing (highlighted by a red box)? Choose from radiator (highlighted by a blue box) and towel (highlighted by a green box).\n(A) radiator\n(B) towel" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430262_185381419761000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, coffee cup (highlighted by a red box) or glass plate (highlighted by a blue box)?\n(A) coffee cup\n(B) glass plate" }, { "from": "gpt", "value": "(A) coffee cup" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458231_78552009472250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, appliance (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458584_1634374923166_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to bathtub (highlighted by a red box)? Select from screen door (highlighted by a blue box) and toiletry (highlighted by a green box).\n(A) screen door\n(B) toiletry" }, { "from": "gpt", "value": "(B) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669959_27728101250208_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to cabinetry (highlighted by a red box)? Select from appliance (highlighted by a blue box) and countertop (highlighted by a green box).\n(A) appliance\n(B) countertop" }, { "from": "gpt", "value": "(B) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430236_181828471643250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, curtain (highlighted by a red box) or clothing (highlighted by a blue box)?\n(A) curtain\n(B) clothing" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430269_185575607670375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, studio couch (highlighted by a red box) or coffee table (highlighted by a blue box)?\n(A) studio couch\n(B) coffee table" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897818_132712693085250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, lamp (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) lamp\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332195_263838943839958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, toilet paper (highlighted by a red box) or water pipe (highlighted by a blue box)?\n(A) toilet paper\n(B) water pipe" }, { "from": "gpt", "value": "(A) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358472_46638379465041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, desk (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) desk\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358241_10521414308083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, toilet (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) toilet\n(B) basket" }, { "from": "gpt", "value": "(A) toilet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332648_369071270552666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to basket (highlighted by a red box), picture frame (highlighted by a blue box) or shelf (highlighted by a green box)?\n(A) picture frame\n(B) shelf" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828245_81729397898333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, lamp (highlighted by a red box) or plant (highlighted by a blue box)?\n(A) lamp\n(B) plant" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739426_191832708090666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to bathroom cabinet (highlighted by a red box)? Choose from sink (highlighted by a blue box) and liquid (highlighted by a green box).\n(A) sink\n(B) liquid" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895449_129285092056333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from counter top (highlighted by a red box)? toiletry (highlighted by a blue box) or mouthwash (highlighted by a green box)?\n(A) toiletry\n(B) mouthwash" }, { "from": "gpt", "value": "(A) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896419_17702730782375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, throw pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) throw pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) throw pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429752_355462979891208_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from mat (highlighted by a red box)? table (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662912_19999751168416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, nightstand (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) nightstand\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828361_80321924665625_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from picture frame (highlighted by a red box)? Choose among these: window sill (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) window sill\n(B) picture frame" }, { "from": "gpt", "value": "(A) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115650_4757649635041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to pillow (highlighted by a red box)? table lamp (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) table lamp\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445587_284606242029500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, mirror (highlighted by a red box) or cleaning product (highlighted by a blue box)?\n(A) mirror\n(B) cleaning product" }, { "from": "gpt", "value": "(B) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895797_680594395574041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the studio couch (highlighted by a red box)? Choose among these: curtain (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) curtain\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332383_398672523029625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the door (highlighted by a red box)? clock (highlighted by a blue box) or door (highlighted by a green box).\n(A) clock\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018817_20123049872750_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, toothpaste (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) toothpaste\n(B) toiletry" }, { "from": "gpt", "value": "(A) toothpaste" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333589_208754089882875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, cleaning product (highlighted by a red box) or mouthwash (highlighted by a blue box)?\n(A) cleaning product\n(B) mouthwash" }, { "from": "gpt", "value": "(A) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739635_2330152232750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, sink (highlighted by a red box) or bath (highlighted by a blue box)?\n(A) sink\n(B) bath" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261658_1201339626000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, door (highlighted by a red box) or bowl (highlighted by a blue box)?\n(A) door\n(B) bowl" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332290_385319604409541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from lamp (highlighted by a red box)? cabinetry (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) cabinetry\n(B) chair" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445869_71893584010375_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458503_113303968336541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of furniture (annotated by the red box) in reference to wheel? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896009_137112268861833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to studio couch (highlighted by a red box)? Choose from chair (highlighted by a blue box) and chair (highlighted by a green box).\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204763_26789611181458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, screen door (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) screen door\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261294_16244839846666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of door (annotated by the red box) and person in the image provided, where is door (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334608_384977755619166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, chest of drawers (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) chest of drawers\n(B) basket" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445583_283661366713750_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, table (highlighted by a red box) or desk (highlighted by a blue box)?\n(A) table\n(B) desk" }, { "from": "gpt", "value": "(B) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331277_13162250550083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, television (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) television\n(B) studio couch" }, { "from": "gpt", "value": "(A) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670133_40059876774833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, sink (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) sink\n(B) bottle" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662897_19437206277750_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to door handle (highlighted by a red box), radiator (highlighted by a blue box) or door (highlighted by a green box)?\n(A) radiator\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445057_3337087856833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, box (highlighted by a red box) or linen (highlighted by a blue box)?\n(A) box\n(B) linen" }, { "from": "gpt", "value": "(B) linen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261686_3855942293875_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429664_9088964756750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, plant (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) plant\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828555_101357520027208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, sink (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) sink\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115575_2533608715125_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to appliance (highlighted by a red box)? Choose from appliance (highlighted by a blue box) and electric outlet (highlighted by a green box).\n(A) appliance\n(B) electric outlet" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261080_343359150250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, baby carriage (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) baby carriage\n(B) basket" }, { "from": "gpt", "value": "(B) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828334_79051124195416_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from flowerpot (highlighted by a red box)? coffee table (highlighted by a blue box) or window sill (highlighted by a green box)?\n(A) coffee table\n(B) window sill" }, { "from": "gpt", "value": "(A) coffee table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429762_356798156161000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, furniture (highlighted by a red box) or cage (highlighted by a blue box)?\n(A) furniture\n(B) cage" }, { "from": "gpt", "value": "(B) cage" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018829_647480572264250_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to material (highlighted by a red box)? pillow (highlighted by a blue box) or studio couch (highlighted by a green box).\n(A) pillow\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334027_273694512943541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, door (highlighted by a red box) or table (highlighted by a blue box)?\n(A) door\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018296_800239606867791_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from bottle (highlighted by a red box)? Choose among these: cleaning product (highlighted by a blue box) or toilet paper (highlighted by a green box).\n(A) cleaning product\n(B) toilet paper" }, { "from": "gpt", "value": "(A) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895868_107596762977041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from desk (highlighted by a red box)? Choose among these: chair (highlighted by a blue box) or door (highlighted by a green box).\n(A) chair\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445955_130002340506750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, reindeer (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) reindeer\n(B) table lamp" }, { "from": "gpt", "value": "(A) reindeer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429855_12666741837583_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to soap dispenser (highlighted by a red box), electric outlet (highlighted by a blue box) or soap (highlighted by a green box)?\n(A) electric outlet\n(B) soap" }, { "from": "gpt", "value": "(B) soap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669925_14091269017000_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to plain (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) picture frame\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333480_60197698019208_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to light switch (highlighted by a red box)? Select from door (highlighted by a blue box) and cupboard (highlighted by a green box).\n(A) door\n(B) cupboard" }, { "from": "gpt", "value": "(B) cupboard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332184_262566819747000_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from window (highlighted by a red box), lamp (highlighted by a blue box) or bed frame (highlighted by a green box)?\n(A) lamp\n(B) bed frame" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896188_141847427328250_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from screen door (highlighted by a red box)? Select from material (highlighted by a blue box) and furniture (highlighted by a green box).\n(A) material\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331358_194789933385333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, mouthwash (highlighted by a red box) or mouthwash (highlighted by a blue box)?\n(A) mouthwash\n(B) mouthwash" }, { "from": "gpt", "value": "(A) mouthwash" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458781_143455746282416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from cabinetry (highlighted by a red box)? kitchen appliance (highlighted by a blue box) or counter top (highlighted by a green box)?\n(A) kitchen appliance\n(B) counter top" }, { "from": "gpt", "value": "(B) counter top" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204363_15834916756666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from material (highlighted by a red box)? studio couch (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429874_14083586826541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is bedside lamp (annotated by the red box) located in relation to chest of drawers in the image? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115180_104075738603625_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to mirror (highlighted by a red box)? Select from sink (highlighted by a blue box) and mirror (highlighted by a green box).\n(A) sink\n(B) mirror" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48017888_79795308346375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, furniture (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) furniture\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261169_1305171147166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, picture frame (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) picture frame\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796271_703960921916_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from toilet (highlighted by a red box)? Choose from mirror (highlighted by a blue box) and tap (highlighted by a green box).\n(A) mirror\n(B) tap" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458700_135296786273333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, radiator (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) radiator\n(B) chair" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895635_471849895993083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, table (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) table\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447287_408746596613416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, paper towel (highlighted by a red box) or coffee machine (highlighted by a blue box)?\n(A) paper towel\n(B) coffee machine" }, { "from": "gpt", "value": "(A) paper towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430585_310610518163000_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from dresser (highlighted by a red box)? Choose among these: furniture (highlighted by a blue box) or swivel chair (highlighted by a green box).\n(A) furniture\n(B) swivel chair" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261172_1510056814333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, curtain (highlighted by a red box) or window screen (highlighted by a blue box)?\n(A) curtain\n(B) window screen" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331491_153115626604791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, studio couch (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) studio couch\n(B) toy" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669959_27782095505583_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from glass door (highlighted by a red box)? door (highlighted by a blue box) or garbage (highlighted by a green box)?\n(A) door\n(B) garbage" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899970_656467942625_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from book (highlighted by a red box)? book (highlighted by a blue box) or table (highlighted by a green box)?\n(A) book\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332177_262456114512457_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the shelf (highlighted by a red box)? Choose among these: curtain (highlighted by a blue box) or window (highlighted by a green box).\n(A) curtain\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204741_25164088478125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is picture frame (annotated by the red box) located relative to picture frame?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358117_62372096019791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from screen door (highlighted by a red box), round table (highlighted by a blue box) or table (highlighted by a green box)?\n(A) round table\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895987_136320715691583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, studio couch (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261355_25783232966583_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, refrigerator (highlighted by a red box) or material (highlighted by a blue box)?\n(A) refrigerator\n(B) material" }, { "from": "gpt", "value": "(B) material" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332106_683042010079125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, changing table (highlighted by a red box) or bed (highlighted by a blue box)?\n(A) changing table\n(B) bed" }, { "from": "gpt", "value": "(A) changing table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828478_100760746271000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, table lamp (highlighted by a red box) or window (highlighted by a blue box)?\n(A) table lamp\n(B) window" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358162_60956731348375_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the window frame (highlighted by a red box)? mirror (highlighted by a blue box) or window frame (highlighted by a green box).\n(A) mirror\n(B) window frame" }, { "from": "gpt", "value": "(B) window frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333581_207644030208166_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to bean bag chair (highlighted by a red box)? Select from cardboard box (highlighted by a blue box) and chair (highlighted by a green box).\n(A) cardboard box\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261339_23949434998583_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from studio couch (highlighted by a red box)? Choose among these: pillow (highlighted by a blue box) or bowl (highlighted by a green box).\n(A) pillow\n(B) bowl" }, { "from": "gpt", "value": "(B) bowl" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896419_17708728392083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chair (highlighted by a red box) or door (highlighted by a blue box)?\n(A) chair\n(B) door" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897755_117582119850666_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from table lamp (highlighted by a red box)? Choose among these: pillow (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649384_11069209833250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, table (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) table\n(B) curtain" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828368_92119529743750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, mirror (highlighted by a red box) or fireplace (highlighted by a blue box)?\n(A) mirror\n(B) fireplace" }, { "from": "gpt", "value": "(B) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115448_11742548445000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, oval (highlighted by a red box) or sink (highlighted by a blue box)?\n(A) oval\n(B) sink" }, { "from": "gpt", "value": "(A) oval" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331277_13051945697458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, appliance (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331177_277412197829583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from book (highlighted by a red box)? book (highlighted by a blue box) or toy (highlighted by a green box)?\n(A) book\n(B) toy" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796463_3595705315125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, mirror (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) mirror\n(B) toiletry" }, { "from": "gpt", "value": "(B) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897818_132722689125166_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from chair (highlighted by a red box), bed (highlighted by a blue box) or lamp (highlighted by a green box)?\n(A) bed\n(B) lamp" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331091_134659015013791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to pillow (highlighted by a red box)? window sill (highlighted by a blue box) or car (highlighted by a green box).\n(A) window sill\n(B) car" }, { "from": "gpt", "value": "(A) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334286_161209640430083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, appliance (highlighted by a red box) or food (highlighted by a blue box)?\n(A) appliance\n(B) food" }, { "from": "gpt", "value": "(B) food" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649440_12593546102041_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from houseplant (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and door (highlighted by a green box).\n(A) picture frame\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430854_74220199017291_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from chest of drawers (highlighted by a red box)? storage box (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) storage box\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204376_18195731831666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to studio couch (highlighted by a red box), pillow (highlighted by a blue box) or swivel chair (highlighted by a green box)?\n(A) pillow\n(B) swivel chair" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333201_47040148293458_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to furniture (highlighted by a red box)? Select from screen door (highlighted by a blue box) and door (highlighted by a green box).\n(A) screen door\n(B) door" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204376_18225719969500_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from swivel chair (highlighted by a red box)? Choose from radiator (highlighted by a blue box) and toy (highlighted by a green box).\n(A) radiator\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649426_10831400225333_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from appliance (highlighted by a red box)? countertop (highlighted by a blue box) or bottle (highlighted by a green box)?\n(A) countertop\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898041_222048019153291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from picture frame (highlighted by a red box)? door (highlighted by a blue box) or door (highlighted by a green box)?\n(A) door\n(B) door" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446462_354122328912875_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from book (highlighted by a red box)? shelf (highlighted by a blue box) or book (highlighted by a green box)?\n(A) shelf\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333308_28123352292375_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the picture frame (highlighted by a red box)? Choose among these: picture frame (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669937_14916694673166_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to screen door (highlighted by a red box)? Select from washing machine (highlighted by a blue box) and recycling bin (highlighted by a green box).\n(A) washing machine\n(B) recycling bin" }, { "from": "gpt", "value": "(A) washing machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458202_74813071413625_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to book (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332519_415964438991041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of electric outlet (annotated by the red box) and table in the image provided, where is electric outlet (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662962_24744091313750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, faucet (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) faucet\n(B) shelf" }, { "from": "gpt", "value": "(A) faucet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649794_46058808688916_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the fireplace (highlighted by a red box)? studio couch (highlighted by a blue box) or studio couch (highlighted by a green box).\n(A) studio couch\n(B) studio couch" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669959_27752091297666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from cabinetry (highlighted by a red box), cabinetry (highlighted by a blue box) or window (highlighted by a green box)?\n(A) cabinetry\n(B) window" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669880_11184304622083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, cabinetry (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) cabinetry\n(B) cabinetry" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898958_821413890503541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from electric outlet (highlighted by a red box)? kitchen appliance (highlighted by a blue box) or toaster (highlighted by a green box)?\n(A) kitchen appliance\n(B) toaster" }, { "from": "gpt", "value": "(A) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115394_3405274192333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to window (highlighted by a red box)? Select from screen door (highlighted by a blue box) and clock (highlighted by a green box).\n(A) screen door\n(B) clock" }, { "from": "gpt", "value": "(B) clock" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333332_30027929327125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, machine (highlighted by a red box) or towel (highlighted by a blue box)?\n(A) machine\n(B) towel" }, { "from": "gpt", "value": "(A) machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895960_133637856943083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, picture frame (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) picture frame\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897467_471429816250083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, desk (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) desk\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444925_220829649924833_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from curtain (highlighted by a red box)? Choose from curtain (highlighted by a blue box) and window (highlighted by a green box).\n(A) curtain\n(B) window" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828362_80386132595833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, television (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) television\n(B) window sill" }, { "from": "gpt", "value": "(A) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334966_669469076183666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, table (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334074_88862572900541_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446493_356484651112958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, window (highlighted by a red box) or light fixture (highlighted by a blue box)?\n(A) window\n(B) light fixture" }, { "from": "gpt", "value": "(B) light fixture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334489_104620220244375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, desk (highlighted by a red box) or television (highlighted by a blue box)?\n(A) desk\n(B) television" }, { "from": "gpt", "value": "(B) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333233_32389962263125_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears farthest from the camera in this image?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430065_34689192963708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, bath mat (highlighted by a red box) or step stool (highlighted by a blue box)?\n(A) bath mat\n(B) step stool" }, { "from": "gpt", "value": "(A) bath mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649603_36069596364166_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649391_10997406238958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, curtain (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) curtain\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796721_27299884783458_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from cabinetry (highlighted by a red box)? Choose from kitchen appliance (highlighted by a blue box) and chair (highlighted by a green box).\n(A) kitchen appliance\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261384_27695059222208_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from round table (highlighted by a red box), pillow (highlighted by a blue box) or fireplace (highlighted by a green box)?\n(A) pillow\n(B) fireplace" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332769_43716027996375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, cabinetry (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) cabinetry\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430246_182507578817208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, book (highlighted by a red box) or bookcase (highlighted by a blue box)?\n(A) book\n(B) bookcase" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896308_6720631428000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, chair (highlighted by a red box) or material (highlighted by a blue box)?\n(A) chair\n(B) material" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897467_471655822159875_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898903_817313727716000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, curtain (highlighted by a red box) or door (highlighted by a blue box)?\n(A) curtain\n(B) door" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446057_79927969728625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of window (annotated by the red box) in reference to plank? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333801_51177549473666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261317_23567473559833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from book (highlighted by a red box), book (highlighted by a blue box) or shelf (highlighted by a green box)?\n(A) book\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430739_336606528228208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, candle (highlighted by a red box) or candle (highlighted by a blue box)?\n(A) candle\n(B) candle" }, { "from": "gpt", "value": "(B) candle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649722_48889918927166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of sheet (annotated by the red box) and throw pillow in the image provided, where is sheet (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430739_336548535437000_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to houseplant (highlighted by a red box)? Select from vase (highlighted by a blue box) and dresser (highlighted by a green box).\n(A) vase\n(B) dresser" }, { "from": "gpt", "value": "(A) vase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261297_16373638938333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the door (highlighted by a red box)? picture frame (highlighted by a blue box) or door (highlighted by a green box).\n(A) picture frame\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333275_24651499955875_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to houseplant (highlighted by a red box)? houseplant (highlighted by a blue box) or stationary bicycle (highlighted by a green box).\n(A) houseplant\n(B) stationary bicycle" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899221_188385777281666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is cupboard (annotated by the red box) located relative to chest of drawers?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899953_865653661650416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, door (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) door\n(B) mat" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896009_137116267195291_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from picture frame (highlighted by a red box)? Choose from lamp (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) lamp\n(B) picture frame" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204820_28681214329833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, lamp (highlighted by a red box) or tableware (highlighted by a blue box)?\n(A) lamp\n(B) tableware" }, { "from": "gpt", "value": "(B) tableware" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663363_91156702273791_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the appliance (highlighted by a red box)? Choose among these: cabinetry (highlighted by a blue box) or electric outlet (highlighted by a green box).\n(A) cabinetry\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358345_15136825847708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to appliance (highlighted by a red box)? Choose from gas stove (highlighted by a blue box) and concrete (highlighted by a green box).\n(A) gas stove\n(B) concrete" }, { "from": "gpt", "value": "(B) concrete" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261532_74100428295583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, window screen (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) window screen\n(B) pillow" }, { "from": "gpt", "value": "(A) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334935_663032888719708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, studio couch (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670208_54051668071000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, cabinetry (highlighted by a red box) or countertop (highlighted by a blue box)?\n(A) cabinetry\n(B) countertop" }, { "from": "gpt", "value": "(B) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260952_6016303250416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, furniture (highlighted by a red box) or concrete (highlighted by a blue box)?\n(A) furniture\n(B) concrete" }, { "from": "gpt", "value": "(B) concrete" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261219_13544821505833_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from houseplant (highlighted by a red box), houseplant (highlighted by a blue box) or houseplant (highlighted by a green box)?\n(A) houseplant\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445211_10816314386916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, swivel chair (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) swivel chair\n(B) picture frame" }, { "from": "gpt", "value": "(A) swivel chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331105_135612980734290_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, table (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47431106_348247288943875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to mouthwash (highlighted by a red box)? Choose from mouthwash (highlighted by a blue box) and mouthwash (highlighted by a green box).\n(A) mouthwash\n(B) mouthwash" }, { "from": "gpt", "value": "(B) mouthwash" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261524_45742747877375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to bookcase (highlighted by a red box), wall clock (highlighted by a blue box) or book (highlighted by a green box)?\n(A) wall clock\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739698_1558413992916_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from air conditioner (highlighted by a red box)? Choose among these: screen door (highlighted by a blue box) or door (highlighted by a green box).\n(A) screen door\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899916_1028227464014916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, toiletry (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) toiletry\n(B) toiletry" }, { "from": "gpt", "value": "(B) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334037_278572911964165_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of miniature (annotated by the red box) in reference to pillow? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333149_40363721904041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of door (annotated by the red box) in relation to postcard?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115427_4863607731916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, window (highlighted by a red box) or bath towel (highlighted by a blue box)?\n(A) window\n(B) bath towel" }, { "from": "gpt", "value": "(B) bath towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739690_1162136823958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, curtain (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) curtain\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663317_76518773097208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of cupboard (annotated by the red box) and light in the image provided, where is cupboard (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458781_143469757395291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is fridge (annotated by the red box) located in relation to window in the image? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261406_29728698061833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897643_146916178300958_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from appliance (highlighted by a red box)? coffee table (highlighted by a blue box) or appliance (highlighted by a green box)?\n(A) coffee table\n(B) appliance" }, { "from": "gpt", "value": "(A) coffee table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649451_12695239189541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the clothing (highlighted by a red box)? Choose among these: clothing (highlighted by a blue box) or wall clock (highlighted by a green box).\n(A) clothing\n(B) wall clock" }, { "from": "gpt", "value": "(A) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204519_1658082328750_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from plastic bag (highlighted by a red box)? furniture (highlighted by a blue box) or plastic bag (highlighted by a green box)?\n(A) furniture\n(B) plastic bag" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670150_40531639926583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, door (highlighted by a red box) or path (highlighted by a blue box)?\n(A) door\n(B) path" }, { "from": "gpt", "value": "(B) path" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899912_1028442659243333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, towel (highlighted by a red box) or towel (highlighted by a blue box)?\n(A) towel\n(B) towel" }, { "from": "gpt", "value": "(B) towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447275_408627612215750_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to electric outlet (highlighted by a red box)? Choose from electric outlet (highlighted by a blue box) and cupboard (highlighted by a green box).\n(A) electric outlet\n(B) cupboard" }, { "from": "gpt", "value": "(A) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899817_254879753200500_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332991_125332093803916_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333055_60266983337208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, houseplant (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) houseplant\n(B) houseplant" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649688_36018454206750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of towel (annotated by the red box) and cloak in the image provided, where is towel (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331165_274212575284583_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, table lamp (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) table lamp\n(B) pillow" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899642_232010291351666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to towel (highlighted by a red box), towel (highlighted by a blue box) or towel (highlighted by a green box)?\n(A) towel\n(B) towel" }, { "from": "gpt", "value": "(A) towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115174_104168735147208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, curtain (highlighted by a red box) or window blind (highlighted by a blue box)?\n(A) curtain\n(B) window blind" }, { "from": "gpt", "value": "(B) window blind" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331935_163734184615666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to coffee cup (highlighted by a red box)? Choose from door (highlighted by a blue box) and studio couch (highlighted by a green box).\n(A) door\n(B) studio couch" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898221_164135429382083_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to doormat (highlighted by a red box), footwear (highlighted by a blue box) or refrigerator (highlighted by a green box)?\n(A) footwear\n(B) refrigerator" }, { "from": "gpt", "value": "(B) refrigerator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899600_202571226232041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, table (highlighted by a red box) or bedside lamp (highlighted by a blue box)?\n(A) table\n(B) bedside lamp" }, { "from": "gpt", "value": "(B) bedside lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429798_737339926178708_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the bulletin board (highlighted by a red box)? lamp (highlighted by a blue box) or bulletin board (highlighted by a green box).\n(A) lamp\n(B) bulletin board" }, { "from": "gpt", "value": "(B) bulletin board" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018828_647388976100458_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the furniture (highlighted by a red box)? Choose among these: table (highlighted by a blue box) or storage box (highlighted by a green box).\n(A) table\n(B) storage box" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895938_107707524057791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, bed (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) bed\n(B) pillow" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332812_48055932830375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from appliance (highlighted by a red box)? Choose among these: cabinetry (highlighted by a blue box) or coffee machine (highlighted by a green box).\n(A) cabinetry\n(B) coffee machine" }, { "from": "gpt", "value": "(B) coffee machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662839_15772951310083_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from picture frame (highlighted by a red box)? table (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) table\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828478_100780754641875_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from chair (highlighted by a red box)? wine glass (highlighted by a blue box) or wine glass (highlighted by a green box)?\n(A) wine glass\n(B) wine glass" }, { "from": "gpt", "value": "(B) wine glass" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115118_84721832007750_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the coffee machine (highlighted by a red box)? Choose among these: cabinetry (highlighted by a blue box) or appliance (highlighted by a green box).\n(A) cabinetry\n(B) appliance" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896020_138368690951625_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897422_104013222602625_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897634_139605968942125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, chest of drawers (highlighted by a red box) or glass vase (highlighted by a blue box)?\n(A) chest of drawers\n(B) glass vase" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018264_793743073255083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, door (highlighted by a red box) or door (highlighted by a blue box)?\n(A) door\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018608_633250507116791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, table lamp (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) table lamp\n(B) chair" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663347_91448103623875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, pillow (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) pillow\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669939_15262942207000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, houseplant (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) houseplant\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115336_2188055371833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the shelf (highlighted by a red box)? desktop computer (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) desktop computer\n(B) cabinetry" }, { "from": "gpt", "value": "(A) desktop computer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261598_52918406398458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, lamp (highlighted by a red box) or entertainment center (highlighted by a blue box)?\n(A) lamp\n(B) entertainment center" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899630_229889268413875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, curtain (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) curtain\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333119_114289352289666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the door (highlighted by a red box)? Choose among these: window (highlighted by a blue box) or lamp (highlighted by a green box).\n(A) window\n(B) lamp" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358410_40662683172500_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from gas stove (highlighted by a red box)? wok (highlighted by a blue box) or bottle (highlighted by a green box)?\n(A) wok\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331542_6910908896750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chest of drawers (highlighted by a red box) or chest of drawers (highlighted by a blue box)?\n(A) chest of drawers\n(B) chest of drawers" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899936_863383280025583_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to postcard (highlighted by a red box), postcard (highlighted by a blue box) or box (highlighted by a green box)?\n(A) postcard\n(B) box" }, { "from": "gpt", "value": "(A) postcard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895448_129533990594541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, flower (highlighted by a red box) or knob (highlighted by a blue box)?\n(A) flower\n(B) knob" }, { "from": "gpt", "value": "(B) knob" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895478_134565717902333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, toy (highlighted by a red box) or mattress (highlighted by a blue box)?\n(A) toy\n(B) mattress" }, { "from": "gpt", "value": "(B) mattress" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261167_1362265227958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018552_830379426801583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, picture frame (highlighted by a red box) or door (highlighted by a blue box)?\n(A) picture frame\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204390_23058885487250_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from chair (highlighted by a red box)? dresser (highlighted by a blue box) or desk (highlighted by a green box)?\n(A) dresser\n(B) desk" }, { "from": "gpt", "value": "(A) dresser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018758_14985349664000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, window (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) window\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796579_16810163752833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, chest of drawers (highlighted by a red box) or sink (highlighted by a blue box)?\n(A) chest of drawers\n(B) sink" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895571_1153740433020291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from footwear (highlighted by a red box)? clothing (highlighted by a blue box) or person (highlighted by a green box)?\n(A) clothing\n(B) person" }, { "from": "gpt", "value": "(B) person" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896482_23889818753916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of chair (annotated by the red box) in relation to radiator?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261502_42606371133166_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from chest of drawers (highlighted by a red box)? bed (highlighted by a blue box) or wall clock (highlighted by a green box)?\n(A) bed\n(B) wall clock" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333657_130175776239875_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from chest of drawers (highlighted by a red box)? sport equipment (highlighted by a blue box) or bed (highlighted by a green box)?\n(A) sport equipment\n(B) bed" }, { "from": "gpt", "value": "(B) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670074_38634506209916_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204449_23008973412791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, file cabinet (highlighted by a red box) or drawer (highlighted by a blue box)?\n(A) file cabinet\n(B) drawer" }, { "from": "gpt", "value": "(A) file cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429764_358118643092250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, window (highlighted by a red box) or floral arrangement (highlighted by a blue box)?\n(A) window\n(B) floral arrangement" }, { "from": "gpt", "value": "(B) floral arrangement" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358238_10450926853041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhere is light fixture (annotated by the red box) located in relation to shower in the image?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828486_100942454187583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chair (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) chair\n(B) radiator" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458447_117498592314791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, cabinetry (highlighted by a red box) or coffee machine (highlighted by a blue box)?\n(A) cabinetry\n(B) coffee machine" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649474_14623236088625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, chest of drawers (highlighted by a red box) or chest of drawers (highlighted by a blue box)?\n(A) chest of drawers\n(B) chest of drawers" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663332_77461160185458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, curtain (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) curtain\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333493_62565690899041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, cabinetry (highlighted by a red box) or countertop (highlighted by a blue box)?\n(A) cabinetry\n(B) countertop" }, { "from": "gpt", "value": "(B) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331003_178733120241208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, pillow (highlighted by a red box) or clothing (highlighted by a blue box)?\n(A) pillow\n(B) clothing" }, { "from": "gpt", "value": "(B) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444750_79642466728083_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332044_207163384524583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the cabinetry (highlighted by a red box)? Choose among these: bar stool (highlighted by a blue box) or bottle (highlighted by a green box).\n(A) bar stool\n(B) bottle" }, { "from": "gpt", "value": "(A) bar stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895279_79211912121875_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from kitchen appliance (highlighted by a red box)? Choose from gas stove (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) gas stove\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261392_27857761555083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to lamp (highlighted by a red box)? Choose from table (highlighted by a blue box) and studio couch (highlighted by a green box).\n(A) table\n(B) studio couch" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429841_11913266038041_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from microwave oven (highlighted by a red box)? document (highlighted by a blue box) or toy (highlighted by a green box)?\n(A) document\n(B) toy" }, { "from": "gpt", "value": "(A) document" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662870_14590368404291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, paper towel (highlighted by a red box) or material (highlighted by a blue box)?\n(A) paper towel\n(B) material" }, { "from": "gpt", "value": "(A) paper towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331343_192405414388458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, speaker (highlighted by a red box) or television (highlighted by a blue box)?\n(A) speaker\n(B) television" }, { "from": "gpt", "value": "(A) speaker" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332398_401559404185666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from pillow (highlighted by a red box)? Choose among these: table lamp (highlighted by a blue box) or light fixture (highlighted by a green box).\n(A) table lamp\n(B) light fixture" }, { "from": "gpt", "value": "(B) light fixture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446450_354685032368125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from furniture (highlighted by a red box)? garbage (highlighted by a blue box) or speaker (highlighted by a green box)?\n(A) garbage\n(B) speaker" }, { "from": "gpt", "value": "(A) garbage" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333988_50380985215541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from window (highlighted by a red box)? Select from curtain (highlighted by a blue box) and shelf (highlighted by a green box).\n(A) curtain\n(B) shelf" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446495_357746527302041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, doormat (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) doormat\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670001_29821666016000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, window (highlighted by a red box) or door (highlighted by a blue box)?\n(A) window\n(B) door" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445781_66634482278625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, bathtub (highlighted by a red box) or toothpaste (highlighted by a blue box)?\n(A) bathtub\n(B) toothpaste" }, { "from": "gpt", "value": "(B) toothpaste" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446466_355450459320750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, vase (highlighted by a red box) or writing desk (highlighted by a blue box)?\n(A) vase\n(B) writing desk" }, { "from": "gpt", "value": "(A) vase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897436_104952931400500_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, door (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) door\n(B) picture frame" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897583_134858244672708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, gas stove (highlighted by a red box) or ceramic tile (highlighted by a blue box)?\n(A) gas stove\n(B) ceramic tile" }, { "from": "gpt", "value": "(B) ceramic tile" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430294_187666460316750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331909_627478479165291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the shelf (highlighted by a red box)? Choose among these: curtain (highlighted by a blue box) or window (highlighted by a green box).\n(A) curtain\n(B) window" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895576_1155376538811625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to toiletry (highlighted by a red box), bath (highlighted by a blue box) or curtain (highlighted by a green box)?\n(A) bath\n(B) curtain" }, { "from": "gpt", "value": "(A) bath" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333111_108673680335833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, appliance (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445848_69403462661916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, bottle (highlighted by a red box) or footwear (highlighted by a blue box)?\n(A) bottle\n(B) footwear" }, { "from": "gpt", "value": "(B) footwear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334867_620711924993041_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from silverware (highlighted by a red box)? cabinetry (highlighted by a blue box) or silverware (highlighted by a green box)?\n(A) cabinetry\n(B) silverware" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649399_9703854997666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, nightstand (highlighted by a red box) or blanket (highlighted by a blue box)?\n(A) nightstand\n(B) blanket" }, { "from": "gpt", "value": "(A) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669878_10508343858208_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from vase (highlighted by a red box), shelf (highlighted by a blue box) or vase (highlighted by a green box)?\n(A) shelf\n(B) vase" }, { "from": "gpt", "value": "(B) vase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204828_28533622692833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, door (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) door\n(B) cabinetry" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897655_147141770528625_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333275_24850501467125_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from light fixture (highlighted by a red box)? dog (highlighted by a blue box) or dog (highlighted by a green box)?\n(A) dog\n(B) dog" }, { "from": "gpt", "value": "(B) dog" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897757_117841212411125_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from book (highlighted by a red box)? Choose among these: furniture (highlighted by a blue box) or book (highlighted by a green box).\n(A) furniture\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897939_351261217849458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, electric outlet (highlighted by a red box) or window (highlighted by a blue box)?\n(A) electric outlet\n(B) window" }, { "from": "gpt", "value": "(A) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333618_76287437925833_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from cabinetry (highlighted by a red box)? Choose among these: bottle (highlighted by a blue box) or silver (highlighted by a green box).\n(A) bottle\n(B) silver" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649775_43390299933333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from dresser (highlighted by a red box)? Choose from chair (highlighted by a blue box) and furniture (highlighted by a green box).\n(A) chair\n(B) furniture" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445169_7889220909208_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from countertop (highlighted by a red box)? lamp (highlighted by a blue box) or microwave oven (highlighted by a green box)?\n(A) lamp\n(B) microwave oven" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899650_233743082784791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the furniture (highlighted by a red box)? picture frame (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) picture frame\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446446_82500120121833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, studio couch (highlighted by a red box) or coffee table (highlighted by a blue box)?\n(A) studio couch\n(B) coffee table" }, { "from": "gpt", "value": "(B) coffee table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261406_29818795767708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from office supplies (highlighted by a red box)? desk (highlighted by a blue box) or television (highlighted by a green box)?\n(A) desk\n(B) television" }, { "from": "gpt", "value": "(B) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430745_336471733638666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, curtain (highlighted by a red box) or window (highlighted by a blue box)?\n(A) curtain\n(B) window" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331084_133946992833375_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from paperback book (highlighted by a red box)? Select from person (highlighted by a blue box) and paperback book (highlighted by a green box).\n(A) person\n(B) paperback book" }, { "from": "gpt", "value": "(A) person" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899900_1026976031733833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to pillow (highlighted by a red box)? table (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) table\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649451_12733240818500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, table (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) table\n(B) bottle" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796191_488722703833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of footwear (annotated by the red box) in reference to astronaut? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828243_81923384255750_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to curtain (highlighted by a red box)? Select from cabinetry (highlighted by a blue box) and curtain (highlighted by a green box).\n(A) cabinetry\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896187_141905121169541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the clothing (highlighted by a red box)? helmet (highlighted by a blue box) or storage box (highlighted by a green box).\n(A) helmet\n(B) storage box" }, { "from": "gpt", "value": "(A) helmet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115143_87038475386833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the cabinetry (highlighted by a red box)? Choose among these: window (highlighted by a blue box) or table (highlighted by a green box).\n(A) window\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663065_38321999181916_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from cabinetry (highlighted by a red box)? tap (highlighted by a blue box) or window (highlighted by a green box)?\n(A) tap\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018899_655437077302375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, mat (highlighted by a red box) or speaker (highlighted by a blue box)?\n(A) mat\n(B) speaker" }, { "from": "gpt", "value": "(B) speaker" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204342_14939703565166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, power outlet (highlighted by a red box) or picnic basket (highlighted by a blue box)?\n(A) power outlet\n(B) picnic basket" }, { "from": "gpt", "value": "(B) picnic basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430150_50842706616333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the bookcase (highlighted by a red box)? Choose among these: book (highlighted by a blue box) or book (highlighted by a green box).\n(A) book\n(B) book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261230_13389319252458_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from door (highlighted by a red box), door (highlighted by a blue box) or cabinetry (highlighted by a green box)?\n(A) door\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897643_146898185549333_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, bowl (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) bowl\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458311_101642582728875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, television (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) television\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898541_180980753828625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, computer desk (highlighted by a red box) or bulletin board (highlighted by a blue box)?\n(A) computer desk\n(B) bulletin board" }, { "from": "gpt", "value": "(A) computer desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662956_24289022817500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, table lamp (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) table lamp\n(B) curtain" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828476_100647060025083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from wine glass (highlighted by a red box)? Select from shelf (highlighted by a blue box) and tableware (highlighted by a green box).\n(A) shelf\n(B) tableware" }, { "from": "gpt", "value": "(B) tableware" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429822_744674690989458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is studio couch (annotated by the red box) located relative to table?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895793_680550596639916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, plant (highlighted by a red box) or door (highlighted by a blue box)?\n(A) plant\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898254_696666041075416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, shelf (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) shelf\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115283_118314735970250_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to cabinetry (highlighted by a red box)? Select from stool (highlighted by a blue box) and bean bag chair (highlighted by a green box).\n(A) stool\n(B) bean bag chair" }, { "from": "gpt", "value": "(A) stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662959_24579489771041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, furniture (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) furniture\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649775_43368308628166_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the chest of drawers (highlighted by a red box)? Choose among these: swivel chair (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) swivel chair\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896160_139946075188374_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, soap (highlighted by a red box) or toothbrush (highlighted by a blue box)?\n(A) soap\n(B) toothbrush" }, { "from": "gpt", "value": "(B) toothbrush" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670184_51633744519416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to window (highlighted by a red box)? Select from curtain (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) curtain\n(B) pillow" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458455_118186235295875_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from cabinetry (highlighted by a red box)? pillow (highlighted by a blue box) or window (highlighted by a green box)?\n(A) pillow\n(B) window" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669874_10430241413250_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from cupboard (highlighted by a red box)? Choose among these: cabinetry (highlighted by a blue box) or washing machine (highlighted by a green box).\n(A) cabinetry\n(B) washing machine" }, { "from": "gpt", "value": "(B) washing machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204291_14490100701541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from appliance (highlighted by a red box)? Choose among these: counter top (highlighted by a blue box) or kitchen appliance (highlighted by a green box).\n(A) counter top\n(B) kitchen appliance" }, { "from": "gpt", "value": "(B) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796684_30788947880333_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to picnic basket (highlighted by a red box)? Choose from clothe (highlighted by a blue box) and screen door (highlighted by a green box).\n(A) clothe\n(B) screen door" }, { "from": "gpt", "value": "(A) clothe" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447216_212547009609958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from home appliance (highlighted by a red box), cabinetry (highlighted by a blue box) or bottle (highlighted by a green box)?\n(A) cabinetry\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429758_356954659198500_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from door (highlighted by a red box)? Choose among these: picture frame (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896177_141342731538291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, glass door (highlighted by a red box) or round table (highlighted by a blue box)?\n(A) glass door\n(B) round table" }, { "from": "gpt", "value": "(A) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458572_266171923666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from jug (highlighted by a red box)? Choose among these: cabinetry (highlighted by a blue box) or kitchen appliance (highlighted by a green box).\n(A) cabinetry\n(B) kitchen appliance" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896063_131996988040458_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, bottle (highlighted by a red box) or bulletin board (highlighted by a blue box)?\n(A) bottle\n(B) bulletin board" }, { "from": "gpt", "value": "(B) bulletin board" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897436_104946933886666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, screen door (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) screen door\n(B) electric outlet" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334966_669413082233625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from window (highlighted by a red box)? Choose among these: window screen (highlighted by a blue box) or radiator (highlighted by a green box).\n(A) window screen\n(B) radiator" }, { "from": "gpt", "value": "(A) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018817_20105040490208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of door (annotated by the red box) in reference to door?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895635_471901691508916_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the shelf (highlighted by a red box)? Choose among these: houseplant (highlighted by a blue box) or book (highlighted by a green box).\n(A) houseplant\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669881_10916910510666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the shelf (highlighted by a red box)? Choose among these: cabinetry (highlighted by a blue box) or electric outlet (highlighted by a green box).\n(A) cabinetry\n(B) electric outlet" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333117_114378649310750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, home appliance (highlighted by a red box) or counter top (highlighted by a blue box)?\n(A) home appliance\n(B) counter top" }, { "from": "gpt", "value": "(B) counter top" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663065_38318000764375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, bookcase (highlighted by a red box) or book (highlighted by a blue box)?\n(A) bookcase\n(B) book" }, { "from": "gpt", "value": "(A) bookcase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898203_145863369072166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, chair (highlighted by a red box) or desk (highlighted by a blue box)?\n(A) chair\n(B) desk" }, { "from": "gpt", "value": "(B) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331711_11299310469958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is lamp (annotated by the red box) located in relation to window in the image? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739315_44739910076708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to centerpiece (highlighted by a red box), couch (highlighted by a blue box) or remote (highlighted by a green box)?\n(A) couch\n(B) remote" }, { "from": "gpt", "value": "(B) remote" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663415_95862669496416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from table (highlighted by a red box), picture frame (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) picture frame\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333293_26489637544708_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, wool (highlighted by a red box) or bath towel (highlighted by a blue box)?\n(A) wool\n(B) bath towel" }, { "from": "gpt", "value": "(A) wool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331938_164873021879458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, door (highlighted by a red box) or flowerpot (highlighted by a blue box)?\n(A) door\n(B) flowerpot" }, { "from": "gpt", "value": "(B) flowerpot" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115158_87630979239125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, electric outlet (highlighted by a red box) or window screen (highlighted by a blue box)?\n(A) electric outlet\n(B) window screen" }, { "from": "gpt", "value": "(A) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739814_15611643183666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, bathtub (highlighted by a red box) or tap (highlighted by a blue box)?\n(A) bathtub\n(B) tap" }, { "from": "gpt", "value": "(A) bathtub" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670186_51568938102083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, curtain (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) curtain\n(B) radiator" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204786_27361573411375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from book (highlighted by a red box)? desk (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) desk\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331480_150986534064500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, exhaust hood (highlighted by a red box) or drawer (highlighted by a blue box)?\n(A) exhaust hood\n(B) drawer" }, { "from": "gpt", "value": "(B) drawer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334834_613826764390333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from chair (highlighted by a red box), studio couch (highlighted by a blue box) or mat (highlighted by a green box)?\n(A) studio couch\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332759_43360225180708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to mouthwash (highlighted by a red box)? Select from toiletry (highlighted by a blue box) and toiletry (highlighted by a green box).\n(A) toiletry\n(B) toiletry" }, { "from": "gpt", "value": "(A) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332618_365598282624333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, table lamp (highlighted by a red box) or armchair (highlighted by a blue box)?\n(A) table lamp\n(B) armchair" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261314_22271942025250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, desk (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) desk\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899559_199460702179666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, door (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) door\n(B) furniture" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331935_163826697013166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, cardboard box (highlighted by a red box) or paperback book (highlighted by a blue box)?\n(A) cardboard box\n(B) paperback book" }, { "from": "gpt", "value": "(B) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331796_10314004514500_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, bidet (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) bidet\n(B) basket" }, { "from": "gpt", "value": "(A) bidet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796750_29680359449791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, furniture (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) furniture\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899913_1028307547950791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from screen door (highlighted by a red box)? Choose from trash bin/can (highlighted by a blue box) and tap (highlighted by a green box).\n(A) trash bin/can\n(B) tap" }, { "from": "gpt", "value": "(B) tap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115205_95213836200083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, cabinetry (highlighted by a red box) or bowl (highlighted by a blue box)?\n(A) cabinetry\n(B) bowl" }, { "from": "gpt", "value": "(B) bowl" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430439_1064447782455_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, bottle (highlighted by a red box) or grapefruit (highlighted by a blue box)?\n(A) bottle\n(B) grapefruit" }, { "from": "gpt", "value": "(B) grapefruit" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358162_60958730556708_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to picture frame (highlighted by a red box)? Choose from mirror (highlighted by a blue box) and vanity (highlighted by a green box).\n(A) mirror\n(B) vanity" }, { "from": "gpt", "value": "(B) vanity" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332467_886392766398708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from window sill (highlighted by a red box)? Choose from window (highlighted by a blue box) and refrigerator (highlighted by a green box).\n(A) window\n(B) refrigerator" }, { "from": "gpt", "value": "(B) refrigerator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261455_35761454626916_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from picture frame (highlighted by a red box)? shelf (highlighted by a blue box) or television (highlighted by a green box)?\n(A) shelf\n(B) television" }, { "from": "gpt", "value": "(B) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47431082_75468128672916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to storage box (highlighted by a red box), storage box (highlighted by a blue box) or storage box (highlighted by a green box)?\n(A) storage box\n(B) storage box" }, { "from": "gpt", "value": "(B) storage box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018087_104061921207166_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the mouthwash (highlighted by a red box)? cleaning product (highlighted by a blue box) or bottle (highlighted by a green box).\n(A) cleaning product\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115244_97698784455083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from table (highlighted by a red box)? Choose from light fixture (highlighted by a blue box) and television (highlighted by a green box).\n(A) light fixture\n(B) television" }, { "from": "gpt", "value": "(A) light fixture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204861_2667753949166_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from window screen (highlighted by a red box)? bay window (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) bay window\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334058_86096486143041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from chair (highlighted by a red box)? Choose among these: radiator (highlighted by a blue box) or speaker (highlighted by a green box).\n(A) radiator\n(B) speaker" }, { "from": "gpt", "value": "(B) speaker" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429799_737886522722625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898248_167851026912625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to window screen (highlighted by a red box), curtain (highlighted by a blue box) or nightstand (highlighted by a green box)?\n(A) curtain\n(B) nightstand" }, { "from": "gpt", "value": "(B) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018608_633214521846208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, cabinetry (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) cabinetry\n(B) bottle" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670334_66380191875499_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, clock (highlighted by a red box) or fruit (highlighted by a blue box)?\n(A) clock\n(B) fruit" }, { "from": "gpt", "value": "(A) clock" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899600_202581738548083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to pillow (highlighted by a red box)? Select from nightstand (highlighted by a blue box) and table lamp (highlighted by a green box).\n(A) nightstand\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358230_10094562428500_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828150_73448099237791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is furniture (annotated by the red box) located relative to step stool? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204585_574521992250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, footwear (highlighted by a red box) or door (highlighted by a blue box)?\n(A) footwear\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204505_898766116875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, microwave oven (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) microwave oven\n(B) appliance" }, { "from": "gpt", "value": "(A) microwave oven" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445103_9228484556375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the curtain (highlighted by a red box)? Choose among these: poster (highlighted by a blue box) or door (highlighted by a green box).\n(A) poster\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429762_356819947315166_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to material (highlighted by a red box)? Choose from furniture (highlighted by a blue box) and blanket (highlighted by a green box).\n(A) furniture\n(B) blanket" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429804_737631825485666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, wine rack (highlighted by a red box) or table (highlighted by a blue box)?\n(A) wine rack\n(B) table" }, { "from": "gpt", "value": "(A) wine rack" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260951_6083893193375_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to chair (highlighted by a red box), picture frame (highlighted by a blue box) or curtain (highlighted by a green box)?\n(A) picture frame\n(B) curtain" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446450_354813029920208_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to mirror (highlighted by a red box)? Select from table (highlighted by a blue box) and furniture (highlighted by a green box).\n(A) table\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358112_61751598853583_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, table (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) table\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897804_131412410885249_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from box (highlighted by a red box)? Choose among these: desktop computer (highlighted by a blue box) or curtain (highlighted by a green box).\n(A) desktop computer\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430966_99503363180125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, door (highlighted by a red box) or power plugs and sockets (highlighted by a blue box)?\n(A) door\n(B) power plugs and sockets" }, { "from": "gpt", "value": "(B) power plugs and sockets" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669959_27856897731375_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to cabinetry (highlighted by a red box)? Choose from window (highlighted by a blue box) and screen door (highlighted by a green box).\n(A) window\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333153_41544319346000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, blanket (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) blanket\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670008_30413586066083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to furniture (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and window sill (highlighted by a green box).\n(A) picture frame\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334783_426522978324958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to elevator door (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and door (highlighted by a green box).\n(A) picture frame\n(B) door" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897467_471537821318583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, plate (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) plate\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204535_2210334363333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, equipment (highlighted by a red box) or table (highlighted by a blue box)?\n(A) equipment\n(B) table" }, { "from": "gpt", "value": "(A) equipment" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018697_544877141035540_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, table (highlighted by a red box) or cloth (highlighted by a blue box)?\n(A) table\n(B) cloth" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445670_60956706831750_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from curtain (highlighted by a red box)? Choose from studio couch (highlighted by a blue box) and curtain (highlighted by a green box).\n(A) studio couch\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899034_643226918370541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from studio couch (highlighted by a red box)? Choose from pillow (highlighted by a blue box) and houseplant (highlighted by a green box).\n(A) pillow\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446576_205903443247166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, throw pillow (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) throw pillow\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895987_136420107610750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663377_92427698141166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, table lamp (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) table lamp\n(B) studio couch" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358167_60817936345791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from television (highlighted by a red box)? Choose among these: studio couch (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) studio couch\n(B) picture frame" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333115_114240955255375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the screen door (highlighted by a red box)? Choose among these: radiator (highlighted by a blue box) or curtain (highlighted by a green box).\n(A) radiator\n(B) curtain" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669959_27742095445708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the home appliance (highlighted by a red box)? Choose among these: cabinetry (highlighted by a blue box) or swivel chair (highlighted by a green box).\n(A) cabinetry\n(B) swivel chair" }, { "from": "gpt", "value": "(B) swivel chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896083_144067891787666_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from oven (highlighted by a red box)? Choose among these: appliance (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739574_198414255873666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, window (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) window\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331479_150943134942500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, door (highlighted by a red box) or postcard (highlighted by a blue box)?\n(A) door\n(B) postcard" }, { "from": "gpt", "value": "(B) postcard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458262_74215145933416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, shelf (highlighted by a red box) or storage box (highlighted by a blue box)?\n(A) shelf\n(B) storage box" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115299_119603134547125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, candle holder (highlighted by a red box) or doormat (highlighted by a blue box)?\n(A) candle holder\n(B) doormat" }, { "from": "gpt", "value": "(B) doormat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898530_181106753988333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to furniture (highlighted by a red box), door (highlighted by a blue box) or stairwell (highlighted by a green box)?\n(A) door\n(B) stairwell" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204724_23498513874833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from curtain (highlighted by a red box)? Choose among these: picture frame (highlighted by a blue box) or chair (highlighted by a green box).\n(A) picture frame\n(B) chair" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896512_33416272632375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to mat (highlighted by a red box), yoga mat (highlighted by a blue box) or table (highlighted by a green box)?\n(A) yoga mat\n(B) table" }, { "from": "gpt", "value": "(A) yoga mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796722_27558982257958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from handbag (highlighted by a red box), desk (highlighted by a blue box) or window screen (highlighted by a green box)?\n(A) desk\n(B) window screen" }, { "from": "gpt", "value": "(B) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115287_118063935138958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, furniture (highlighted by a red box) or door (highlighted by a blue box)?\n(A) furniture\n(B) door" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895863_107846159702708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, furniture (highlighted by a red box) or picnic basket (highlighted by a blue box)?\n(A) furniture\n(B) picnic basket" }, { "from": "gpt", "value": "(B) picnic basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445462_151060629051166_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445938_79450567347708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, toy (highlighted by a red box) or couch (highlighted by a blue box)?\n(A) toy\n(B) couch" }, { "from": "gpt", "value": "(B) couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895184_37797479596333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, picture frame (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) picture frame\n(B) furniture" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47330995_176949691957916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, laptop (highlighted by a red box) or swivel chair (highlighted by a blue box)?\n(A) laptop\n(B) swivel chair" }, { "from": "gpt", "value": "(B) swivel chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331918_629170791875166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, electric outlet (highlighted by a red box) or plug (highlighted by a blue box)?\n(A) electric outlet\n(B) plug" }, { "from": "gpt", "value": "(B) plug" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445680_62048365598250_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the table (highlighted by a red box)? Choose among these: toy (highlighted by a blue box) or chair (highlighted by a green box).\n(A) toy\n(B) chair" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334837_613741249034500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, floral arrangement (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) floral arrangement\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018149_372820794116666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to picture frame (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358253_6165041501125_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from pillow (highlighted by a red box), pillow (highlighted by a blue box) or stripe (highlighted by a green box)?\n(A) pillow\n(B) stripe" }, { "from": "gpt", "value": "(B) stripe" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447294_408996909897083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, food (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) food\n(B) basket" }, { "from": "gpt", "value": "(A) food" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358238_10446911848833_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from gray (highlighted by a red box)? Choose from mirror (highlighted by a blue box) and balustrade (highlighted by a green box).\n(A) mirror\n(B) balustrade" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444925_220821653185083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, curtain (highlighted by a red box) or air conditioning (highlighted by a blue box)?\n(A) curtain\n(B) air conditioning" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430097_28750871965791_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333801_51133550624583_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, houseplant (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) houseplant\n(B) radiator" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899285_885253566069333_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, screen door (highlighted by a red box) or water heater (highlighted by a blue box)?\n(A) screen door\n(B) water heater" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332320_390796770386041_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from appliance (highlighted by a red box)? refrigerator (highlighted by a blue box) or cabinetry (highlighted by a green box)?\n(A) refrigerator\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445834_68153685143958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, material (highlighted by a red box) or food (highlighted by a blue box)?\n(A) material\n(B) food" }, { "from": "gpt", "value": "(A) material" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48017890_81017945799125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from appliance (highlighted by a red box)? Choose among these: appliance (highlighted by a blue box) or kitchen appliance (highlighted by a green box).\n(A) appliance\n(B) kitchen appliance" }, { "from": "gpt", "value": "(B) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739690_1104143119625_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chair (highlighted by a red box) or concrete (highlighted by a blue box)?\n(A) chair\n(B) concrete" }, { "from": "gpt", "value": "(B) concrete" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663250_75010275142875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the glass vase (highlighted by a red box)? Choose among these: cupboard (highlighted by a blue box) or screen door (highlighted by a green box).\n(A) cupboard\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204329_14345615709000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, table (highlighted by a red box) or mirror (highlighted by a blue box)?\n(A) table\n(B) mirror" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334713_533810578503750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, laptop (highlighted by a red box) or stationery (highlighted by a blue box)?\n(A) laptop\n(B) stationery" }, { "from": "gpt", "value": "(B) stationery" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897728_114203534612583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, bookcase (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) bookcase\n(B) curtain" }, { "from": "gpt", "value": "(A) bookcase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670158_40768129642416_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from coffeepot (highlighted by a red box)? Choose among these: picture frame (highlighted by a blue box) or coffeepot (highlighted by a green box).\n(A) picture frame\n(B) coffeepot" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895469_132847910956415_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, houseplant (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) houseplant\n(B) houseplant" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458329_102821623342333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to radiator (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and television (highlighted by a green box).\n(A) picture frame\n(B) television" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358176_62241631556208_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to pillow (highlighted by a red box), table (highlighted by a blue box) or lamp (highlighted by a green box)?\n(A) table\n(B) lamp" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261541_74287734098750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, toy (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) toy\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649474_14653240864000_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from pillow (highlighted by a red box)? Choose among these: chair (highlighted by a blue box) or swivel chair (highlighted by a green box).\n(A) chair\n(B) swivel chair" }, { "from": "gpt", "value": "(B) swivel chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899483_955299522072791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, train window (highlighted by a red box) or flyer (highlighted by a blue box)?\n(A) train window\n(B) flyer" }, { "from": "gpt", "value": "(B) flyer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261600_52976899916541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, radiator (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) radiator\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430127_32640746838500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from door (highlighted by a red box)? Select from laundry (highlighted by a blue box) and sink (highlighted by a green box).\n(A) laundry\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332746_42476419589833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from picture frame (highlighted by a red box)? curtain (highlighted by a blue box) or bulletin board (highlighted by a green box)?\n(A) curtain\n(B) bulletin board" }, { "from": "gpt", "value": "(B) bulletin board" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331028_474680321979916_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from table (highlighted by a red box), table (highlighted by a blue box) or flowerpot (highlighted by a green box)?\n(A) table\n(B) flowerpot" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663064_38426491192916_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the loudspeaker (highlighted by a red box)? desk (highlighted by a blue box) or houseplant (highlighted by a green box).\n(A) desk\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897722_114308640915041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, electric outlet (highlighted by a red box) or picnic basket (highlighted by a blue box)?\n(A) electric outlet\n(B) picnic basket" }, { "from": "gpt", "value": "(A) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332587_360578445802333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, houseplant (highlighted by a red box) or paperback book (highlighted by a blue box)?\n(A) houseplant\n(B) paperback book" }, { "from": "gpt", "value": "(B) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331091_134663013390208_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from car (highlighted by a red box)? Choose among these: toy (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) toy\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899043_645742110965125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from appliance (highlighted by a red box), countertop (highlighted by a blue box) or plate (highlighted by a green box)?\n(A) countertop\n(B) plate" }, { "from": "gpt", "value": "(B) plate" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796446_609714134416_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from radiator (highlighted by a red box)? Select from armoire (highlighted by a blue box) and nightstand (highlighted by a green box).\n(A) armoire\n(B) nightstand" }, { "from": "gpt", "value": "(A) armoire" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649425_10752914637833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, cabinetry (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) cabinetry\n(B) appliance" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895833_1221751720932375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, toy (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446444_82643013588458_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to christmas tree (highlighted by a red box)? Choose from animal (highlighted by a blue box) and desk (highlighted by a green box).\n(A) animal\n(B) desk" }, { "from": "gpt", "value": "(B) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018800_18818194440750_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from table (highlighted by a red box)? Select from door (highlighted by a blue box) and door (highlighted by a green box).\n(A) door\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333801_51151543341708_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from paper towel (highlighted by a red box)? book (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) book\n(B) chair" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115394_3421267863000_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from coffee machine (highlighted by a red box)? Choose from countertop (highlighted by a blue box) and home appliance (highlighted by a green box).\n(A) countertop\n(B) home appliance" }, { "from": "gpt", "value": "(B) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670197_53486704932416_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358380_18918840198541_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from pillow (highlighted by a red box)? Select from pillow (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) pillow\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447226_212390423978625_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, shelf (highlighted by a red box) or beach towel (highlighted by a blue box)?\n(A) shelf\n(B) beach towel" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358624_435705316291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from clothing (highlighted by a red box)? Choose among these: picture frame (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896522_34700321087625_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to bottle (highlighted by a red box)? bottle (highlighted by a blue box) or lamp (highlighted by a green box).\n(A) bottle\n(B) lamp" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670073_38450216062541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to window (highlighted by a red box), music stool (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) music stool\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260946_4715896119500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from book (highlighted by a red box), picture frame (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331909_627464484794625_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897643_146930172659291_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897756_117706518311291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, lamp (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) lamp\n(B) picture frame" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663044_36123467624208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, bay window (highlighted by a red box) or window frame (highlighted by a blue box)?\n(A) bay window\n(B) window frame" }, { "from": "gpt", "value": "(B) window frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445707_63790604926625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, toy (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334222_107099214187791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from stationery (highlighted by a red box)? Select from stationery (highlighted by a blue box) and toy (highlighted by a green box).\n(A) stationery\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204305_15348270263125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895614_470417098985625_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, toilet paper (highlighted by a red box) or soap (highlighted by a blue box)?\n(A) toilet paper\n(B) soap" }, { "from": "gpt", "value": "(B) soap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331143_177732640722583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the toilet paper (highlighted by a red box)? toilet paper (highlighted by a blue box) or mouthwash (highlighted by a green box).\n(A) toilet paper\n(B) mouthwash" }, { "from": "gpt", "value": "(A) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331091_134655016637291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, pillow (highlighted by a red box) or dog (highlighted by a blue box)?\n(A) pillow\n(B) dog" }, { "from": "gpt", "value": "(B) dog" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333056_60189581383125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, electric outlet (highlighted by a red box) or book (highlighted by a blue box)?\n(A) electric outlet\n(B) book" }, { "from": "gpt", "value": "(A) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334615_385645622023916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chair (highlighted by a red box) or trash bin/can (highlighted by a blue box)?\n(A) chair\n(B) trash bin/can" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828486_100888443288833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, stool (highlighted by a red box) or stool (highlighted by a blue box)?\n(A) stool\n(B) stool" }, { "from": "gpt", "value": "(A) stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898261_696821027316916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, picture frame (highlighted by a red box) or speaker (highlighted by a blue box)?\n(A) picture frame\n(B) speaker" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670356_67365486423416_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears farthest from the camera in this image?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649680_35515024756416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, sink (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) sink\n(B) screen door" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899630_229915274723166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to coffee table (highlighted by a red box), book (highlighted by a blue box) or magazine (highlighted by a green box)?\n(A) book\n(B) magazine" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896089_143944093046000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, laptop (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) laptop\n(B) cabinetry" }, { "from": "gpt", "value": "(A) laptop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358167_60891940323000_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from pillow (highlighted by a red box)? furniture (highlighted by a blue box) or screen door (highlighted by a green box)?\n(A) furniture\n(B) screen door" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333277_24498512711708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to bookshelf (highlighted by a red box)? studio couch (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430931_92905383314916_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears farthest from the camera in this image?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261556_75638876273916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from toy (highlighted by a red box)? shelf (highlighted by a blue box) or door (highlighted by a green box)?\n(A) shelf\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115424_4945408719375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from mirror (highlighted by a red box), window sill (highlighted by a blue box) or appliance (highlighted by a green box)?\n(A) window sill\n(B) appliance" }, { "from": "gpt", "value": "(A) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333674_134191753141500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, book (highlighted by a red box) or paperback book (highlighted by a blue box)?\n(A) book\n(B) paperback book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333803_51546849440208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, toy (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115628_3415096697916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, door (highlighted by a red box) or table (highlighted by a blue box)?\n(A) door\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739629_1975671263083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, book (highlighted by a red box) or plain (highlighted by a blue box)?\n(A) book\n(B) plain" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445128_5124229430208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, curtain (highlighted by a red box) or bath towel (highlighted by a blue box)?\n(A) curtain\n(B) bath towel" }, { "from": "gpt", "value": "(B) bath towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444499_2458914221666_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to picture frame (highlighted by a red box)? Select from window (highlighted by a blue box) and screen door (highlighted by a green box).\n(A) window\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669876_10391340130875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the home appliance (highlighted by a red box)? laundry (highlighted by a blue box) or electric outlet (highlighted by a green box).\n(A) laundry\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649603_36065598026250_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from screen door (highlighted by a red box)? Choose from chair (highlighted by a blue box) and book (highlighted by a green box).\n(A) chair\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669876_10393339340416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, footwear (highlighted by a red box) or shoe (highlighted by a blue box)?\n(A) footwear\n(B) shoe" }, { "from": "gpt", "value": "(A) footwear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895864_489596271609041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, window (highlighted by a red box) or wall clock (highlighted by a blue box)?\n(A) window\n(B) wall clock" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898510_160697687256083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from picture frame (highlighted by a red box)? chest of drawers (highlighted by a blue box) or vanity (highlighted by a green box)?\n(A) chest of drawers\n(B) vanity" }, { "from": "gpt", "value": "(B) vanity" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899663_234377473355000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, window frame (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) window frame\n(B) screen door" }, { "from": "gpt", "value": "(A) window frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895633_471724097267083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, computer (highlighted by a red box) or home appliance (highlighted by a blue box)?\n(A) computer\n(B) home appliance" }, { "from": "gpt", "value": "(A) computer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896490_31606345490541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from shelf (highlighted by a red box)? Choose among these: cleaning product (highlighted by a blue box) or mouthwash (highlighted by a green box).\n(A) cleaning product\n(B) mouthwash" }, { "from": "gpt", "value": "(B) mouthwash" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334879_621754808024125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of window (annotated by the red box) in reference to curtain? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796366_10602442449750_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430410_127204300673083_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446446_82364107279666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to appliance (highlighted by a red box)? Choose from cabinetry (highlighted by a blue box) and drawer (highlighted by a green box).\n(A) cabinetry\n(B) drawer" }, { "from": "gpt", "value": "(B) drawer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333463_57268571789375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, picture frame (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) picture frame\n(B) shelf" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669960_27627093106500_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to cabinetry (highlighted by a red box), chair (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331041_479806718822208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, table (highlighted by a red box) or fruit (highlighted by a blue box)?\n(A) table\n(B) fruit" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331154_181632712129333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, kitchen appliance (highlighted by a red box) or home appliance (highlighted by a blue box)?\n(A) kitchen appliance\n(B) home appliance" }, { "from": "gpt", "value": "(A) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896121_145919123347375_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the window (highlighted by a red box)? Choose among these: robe (highlighted by a blue box) or glass door (highlighted by a green box).\n(A) robe\n(B) glass door" }, { "from": "gpt", "value": "(B) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898959_821207691602958_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895199_39508113396250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chair (highlighted by a red box) or coffee table (highlighted by a blue box)?\n(A) chair\n(B) coffee table" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332383_398658528706000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, shelf (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) shelf\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796507_3193609797666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from coffee cup (highlighted by a red box)? fireplace (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) fireplace\n(B) picture frame" }, { "from": "gpt", "value": "(A) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897709_111996301442250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, chair (highlighted by a red box) or armchair (highlighted by a blue box)?\n(A) chair\n(B) armchair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261677_3059553042708_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, picture frame (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) picture frame\n(B) radiator" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895235_73955892464875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, postcard (highlighted by a red box) or footwear (highlighted by a blue box)?\n(A) postcard\n(B) footwear" }, { "from": "gpt", "value": "(B) footwear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739612_200161847628000_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from medicine cabinet (highlighted by a red box), toilet paper (highlighted by a blue box) or toiletry (highlighted by a green box)?\n(A) toilet paper\n(B) toiletry" }, { "from": "gpt", "value": "(A) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430401_126680796288833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to sink (highlighted by a red box), cabinetry (highlighted by a blue box) or bottle (highlighted by a green box)?\n(A) cabinetry\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895911_111446845819333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, window sill (highlighted by a red box) or window (highlighted by a blue box)?\n(A) window sill\n(B) window" }, { "from": "gpt", "value": "(A) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446446_82390113642333_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, bar stool (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) bar stool\n(B) cabinetry" }, { "from": "gpt", "value": "(A) bar stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260890_8702210630875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from mirror (highlighted by a red box)? Choose from toiletry (highlighted by a blue box) and shelf (highlighted by a green box).\n(A) toiletry\n(B) shelf" }, { "from": "gpt", "value": "(A) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331187_278123195453831_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to tap (highlighted by a red box), refrigerator (highlighted by a blue box) or plant (highlighted by a green box)?\n(A) refrigerator\n(B) plant" }, { "from": "gpt", "value": "(B) plant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261275_14287656450416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to picture frame (highlighted by a red box)? Select from picture frame (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204506_686470839458_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, cabinetry (highlighted by a red box) or door (highlighted by a blue box)?\n(A) cabinetry\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897870_529934959607083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, window (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) window\n(B) appliance" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739925_16384067497375_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from nightstand (highlighted by a red box)? Select from brush (highlighted by a blue box) and mirror (highlighted by a green box).\n(A) brush\n(B) mirror" }, { "from": "gpt", "value": "(B) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334163_348187827855583_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from curtain (highlighted by a red box), pillow (highlighted by a blue box) or table lamp (highlighted by a green box)?\n(A) pillow\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331211_281170258259125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chair (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) chair\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334920_1091067895719666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, bathtub (highlighted by a red box) or soap dispenser (highlighted by a blue box)?\n(A) bathtub\n(B) soap dispenser" }, { "from": "gpt", "value": "(A) bathtub" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828498_101770697680833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, screen door (highlighted by a red box) or washer (highlighted by a blue box)?\n(A) screen door\n(B) washer" }, { "from": "gpt", "value": "(B) washer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447216_212507026071666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the desk (highlighted by a red box)? leftover (highlighted by a blue box) or laundry (highlighted by a green box).\n(A) leftover\n(B) laundry" }, { "from": "gpt", "value": "(A) leftover" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796709_27471083744833_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from cabinetry (highlighted by a red box)? chair (highlighted by a blue box) or table (highlighted by a green box)?\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331893_623321045771000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of chest of drawers (annotated by the red box) in reference to backpack?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261294_16246839056375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, picture frame (highlighted by a red box) or bed (highlighted by a blue box)?\n(A) picture frame\n(B) bed" }, { "from": "gpt", "value": "(B) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895298_91159129141916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331508_155181905149708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to door (highlighted by a red box)? Choose from cage (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) cage\n(B) cabinetry" }, { "from": "gpt", "value": "(A) cage" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444754_80979158468875_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from lamp (highlighted by a red box), control (highlighted by a blue box) or writing (highlighted by a green box)?\n(A) control\n(B) writing" }, { "from": "gpt", "value": "(A) control" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897490_471222818882083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the clock (highlighted by a red box)? window sill (highlighted by a blue box) or clock (highlighted by a green box).\n(A) window sill\n(B) clock" }, { "from": "gpt", "value": "(B) clock" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670044_33337401937458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, lamp (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) lamp\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670234_52918978562916_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from sink (highlighted by a red box)? Choose among these: toilet (highlighted by a blue box) or bath (highlighted by a green box).\n(A) toilet\n(B) bath" }, { "from": "gpt", "value": "(B) bath" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444908_106330658071958_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to appliance (highlighted by a red box), table (highlighted by a blue box) or furniture (highlighted by a green box)?\n(A) table\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358230_10036369906791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, archway (highlighted by a red box) or window (highlighted by a blue box)?\n(A) archway\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899955_865610862726333_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47431146_350782672408833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, mirror (highlighted by a red box) or bookcase (highlighted by a blue box)?\n(A) mirror\n(B) bookcase" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663053_38569401320125_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the picture frame (highlighted by a red box)? Choose among these: bookcase (highlighted by a blue box) or book (highlighted by a green box).\n(A) bookcase\n(B) book" }, { "from": "gpt", "value": "(A) bookcase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204678_12552438472375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to cupboard (highlighted by a red box), book (highlighted by a blue box) or radiator (highlighted by a green box)?\n(A) book\n(B) radiator" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430217_180345211770041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from mat (highlighted by a red box)? chair (highlighted by a blue box) or wide (highlighted by a green box)?\n(A) chair\n(B) wide" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739281_42608767639875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, couch (highlighted by a red box) or armchair (highlighted by a blue box)?\n(A) couch\n(B) armchair" }, { "from": "gpt", "value": "(B) armchair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333803_51625150877333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, furniture (highlighted by a red box) or sheet (highlighted by a blue box)?\n(A) furniture\n(B) sheet" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896177_141350745036416_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899271_883775104925625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, porcelain (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) porcelain\n(B) toilet paper" }, { "from": "gpt", "value": "(A) porcelain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332986_124542868672333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from basket (highlighted by a red box), basket (highlighted by a blue box) or material (highlighted by a green box)?\n(A) basket\n(B) material" }, { "from": "gpt", "value": "(B) material" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261522_45826148205583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, mirror (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) mirror\n(B) cabinetry" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897490_471164226479041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, appliance (highlighted by a red box) or home appliance (highlighted by a blue box)?\n(A) appliance\n(B) home appliance" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429816_744593907364666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, houseplant (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) houseplant\n(B) houseplant" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334629_386355139583125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, furniture (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) furniture\n(B) toiletry" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331041_479835024099291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, chair (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) chair\n(B) shelf" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333031_59046928463625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, couch (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) couch\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796751_29747666166625_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739455_51592085281083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, cabinetry (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) cabinetry\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663376_92391295876583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, radiator (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) radiator\n(B) studio couch" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447199_87971094846708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to book (highlighted by a red box)? Select from bicycle (highlighted by a blue box) and armchair (highlighted by a green box).\n(A) bicycle\n(B) armchair" }, { "from": "gpt", "value": "(A) bicycle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458506_113198676634041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from studio couch (highlighted by a red box)? Select from pillow (highlighted by a blue box) and window (highlighted by a green box).\n(A) pillow\n(B) window" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115334_2335460997875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, mug (highlighted by a red box) or window blind (highlighted by a blue box)?\n(A) mug\n(B) window blind" }, { "from": "gpt", "value": "(B) window blind" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261252_12838304455666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the desk (highlighted by a red box)? Choose among these: swivel chair (highlighted by a blue box) or studio couch (highlighted by a green box).\n(A) swivel chair\n(B) studio couch" }, { "from": "gpt", "value": "(A) swivel chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331107_135534978991541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, glass door (highlighted by a red box) or door (highlighted by a blue box)?\n(A) glass door\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896527_34776922650875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to apple (highlighted by a red box), shelf (highlighted by a blue box) or bowl (highlighted by a green box)?\n(A) shelf\n(B) bowl" }, { "from": "gpt", "value": "(B) bowl" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796358_10455350611500_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895482_134693415875665_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, storage box (highlighted by a red box) or box (highlighted by a blue box)?\n(A) storage box\n(B) box" }, { "from": "gpt", "value": "(B) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663065_38371996078083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, studio couch (highlighted by a red box) or glass door (highlighted by a blue box)?\n(A) studio couch\n(B) glass door" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897655_147145785571250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is chair (annotated by the red box) located in relation to houseplant in the image? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898625_757793107407875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, cleaning product (highlighted by a red box) or cleaning product (highlighted by a blue box)?\n(A) cleaning product\n(B) cleaning product" }, { "from": "gpt", "value": "(B) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663226_66748066967666_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429851_12790841435833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to toiletry (highlighted by a red box)? Choose from mouthwash (highlighted by a blue box) and mouthwash (highlighted by a green box).\n(A) mouthwash\n(B) mouthwash" }, { "from": "gpt", "value": "(A) mouthwash" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429871_14215483566250_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from shelf (highlighted by a red box)? shelf (highlighted by a blue box) or shelf (highlighted by a green box)?\n(A) shelf\n(B) shelf" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669896_11124711585125_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to coffee table (highlighted by a red box)? Choose from table (highlighted by a blue box) and studio couch (highlighted by a green box).\n(A) table\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446558_86696972314208_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from bowl (highlighted by a red box)? countertop (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) countertop\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896404_16733512909041_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331281_14152401712875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, bottle (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332158_260071728003791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, cabinetry (highlighted by a red box) or window (highlighted by a blue box)?\n(A) cabinetry\n(B) window" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897757_117857222422875_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the pillow (highlighted by a red box)? Choose among these: table (highlighted by a blue box) or chair (highlighted by a green box).\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261228_13800715059291_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to basket (highlighted by a red box)? chest of drawers (highlighted by a blue box) or fireplace (highlighted by a green box).\n(A) chest of drawers\n(B) fireplace" }, { "from": "gpt", "value": "(B) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331699_9543424646416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to shelf (highlighted by a red box)? laptop (highlighted by a blue box) or desk (highlighted by a green box).\n(A) laptop\n(B) desk" }, { "from": "gpt", "value": "(B) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458262_74137143430041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, curtain (highlighted by a red box) or book (highlighted by a blue box)?\n(A) curtain\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334883_622619699197541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the clock (highlighted by a red box)? blanket (highlighted by a blue box) or chest of drawers (highlighted by a green box).\n(A) blanket\n(B) chest of drawers" }, { "from": "gpt", "value": "(A) blanket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649633_39553238753291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, gas stove (highlighted by a red box) or oven (highlighted by a blue box)?\n(A) gas stove\n(B) oven" }, { "from": "gpt", "value": "(A) gas stove" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333603_75471587834333_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899202_186836878706875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chest of drawers (highlighted by a red box) or vanity (highlighted by a blue box)?\n(A) chest of drawers\n(B) vanity" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895816_685877442697958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to bath (highlighted by a red box)? Select from counter top (highlighted by a blue box) and bath towel (highlighted by a green box).\n(A) counter top\n(B) bath towel" }, { "from": "gpt", "value": "(B) bath towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334066_87381216780000_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from mouthwash (highlighted by a red box)? Select from glass door (highlighted by a blue box) and cleaning product (highlighted by a green box).\n(A) glass door\n(B) cleaning product" }, { "from": "gpt", "value": "(A) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662829_15175599634916_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from appliance (highlighted by a red box)? Choose among these: countertop (highlighted by a blue box) or kitchen appliance (highlighted by a green box).\n(A) countertop\n(B) kitchen appliance" }, { "from": "gpt", "value": "(A) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897757_117793215677000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, desk (highlighted by a red box) or blanket (highlighted by a blue box)?\n(A) desk\n(B) blanket" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899909_1027536770547750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, furniture (highlighted by a red box) or door (highlighted by a blue box)?\n(A) furniture\n(B) door" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333870_76168077607708_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the window sill (highlighted by a red box)? Choose among these: chair (highlighted by a blue box) or plant (highlighted by a green box).\n(A) chair\n(B) plant" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895983_407272161647666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, table (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) table\n(B) toilet paper" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796584_17413680976500_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the picture frame (highlighted by a red box)? Choose among these: bath towel (highlighted by a blue box) or window (highlighted by a green box).\n(A) bath towel\n(B) window" }, { "from": "gpt", "value": "(A) bath towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332201_264248273614124_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, houseplant (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) houseplant\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331298_15004349983875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, glass vase (highlighted by a red box) or glass vase (highlighted by a blue box)?\n(A) glass vase\n(B) glass vase" }, { "from": "gpt", "value": "(A) glass vase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899657_234507871671333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, window (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) window\n(B) screen door" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444821_56521050320750_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898256_696448030446416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from curtain (highlighted by a red box)? Choose among these: door (highlighted by a blue box) or screen door (highlighted by a green box).\n(A) door\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670201_53331402885416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, furniture (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) furniture\n(B) curtain" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261099_1004855940208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, clock (highlighted by a red box) or vent (highlighted by a blue box)?\n(A) clock\n(B) vent" }, { "from": "gpt", "value": "(B) vent" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458634_127495875810708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to couch (highlighted by a red box)? Choose from table (highlighted by a blue box) and candle holder (highlighted by a green box).\n(A) table\n(B) candle holder" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261241_15075599815833_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from shelf (highlighted by a red box), desk (highlighted by a blue box) or book (highlighted by a green box)?\n(A) desk\n(B) book" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458330_103003714374125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, computer chair (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) computer chair\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430269_185661606033708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to book (highlighted by a red box)? toy (highlighted by a blue box) or bottle (highlighted by a green box).\n(A) toy\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018550_830258725896125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the file cabinet (highlighted by a red box)? curtain (highlighted by a blue box) or electric outlet (highlighted by a green box).\n(A) curtain\n(B) electric outlet" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896551_30216605027416_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896133_147062724355583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to window (highlighted by a red box)? Choose from wall clock (highlighted by a blue box) and lamp (highlighted by a green box).\n(A) wall clock\n(B) lamp" }, { "from": "gpt", "value": "(A) wall clock" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444822_56653845585000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, lamp (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) lamp\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895614_470413100614583_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898510_160653688818250_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from screen door (highlighted by a red box)? Choose among these: door (highlighted by a blue box) or flower (highlighted by a green box).\n(A) door\n(B) flower" }, { "from": "gpt", "value": "(B) flower" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430802_61093470315375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, mirror (highlighted by a red box) or table (highlighted by a blue box)?\n(A) mirror\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332624_365543488255166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhere is computer monitor (annotated by the red box) located in relation to window in the image?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358698_3062717896416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, window (highlighted by a red box) or table (highlighted by a blue box)?\n(A) window\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898696_580849685911583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, drawer (highlighted by a red box) or gas stove (highlighted by a blue box)?\n(A) drawer\n(B) gas stove" }, { "from": "gpt", "value": "(A) drawer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333288_25269132494583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, door (highlighted by a red box) or stairwell (highlighted by a blue box)?\n(A) door\n(B) stairwell" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895622_470839845900750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, toiletries (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) toiletries\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796709_27463086911083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to chair (highlighted by a red box), chair (highlighted by a blue box) or pitcher (highlighted by a green box)?\n(A) chair\n(B) pitcher" }, { "from": "gpt", "value": "(B) pitcher" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458337_102894726342416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, studio couch (highlighted by a red box) or baby (highlighted by a blue box)?\n(A) studio couch\n(B) baby" }, { "from": "gpt", "value": "(B) baby" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669854_12655445847166_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to toy (highlighted by a red box)? Select from table (highlighted by a blue box) and screen door (highlighted by a green box).\n(A) table\n(B) screen door" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897643_146865881884666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, oven (highlighted by a red box) or home appliance (highlighted by a blue box)?\n(A) oven\n(B) home appliance" }, { "from": "gpt", "value": "(A) oven" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896304_6834136511791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, table (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115415_4161561776833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the furniture (highlighted by a red box)? wood burning stove (highlighted by a blue box) or doormat (highlighted by a green box).\n(A) wood burning stove\n(B) doormat" }, { "from": "gpt", "value": "(B) doormat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331479_150905133609291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, tap (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) tap\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331520_190680280930375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, bottle (highlighted by a red box) or fridge (highlighted by a blue box)?\n(A) bottle\n(B) fridge" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670208_54177665559500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, pillow (highlighted by a red box) or window (highlighted by a blue box)?\n(A) pillow\n(B) window" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444712_73993708884000_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from nightstand (highlighted by a red box), electric outlet (highlighted by a blue box) or lamp (highlighted by a green box)?\n(A) electric outlet\n(B) lamp" }, { "from": "gpt", "value": "(A) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458569_164980591166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, basket (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) basket\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898349_509459021825291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from toilet paper (highlighted by a red box), plumbing fixture (highlighted by a blue box) or toilet (highlighted by a green box)?\n(A) plumbing fixture\n(B) toilet" }, { "from": "gpt", "value": "(B) toilet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018415_394375232878083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, bath towel (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) bath towel\n(B) curtain" }, { "from": "gpt", "value": "(A) bath towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331422_544169026502582_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, blanket (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) blanket\n(B) pillow" }, { "from": "gpt", "value": "(A) blanket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018153_373377673168125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is furniture (annotated by the red box) located relative to furniture? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334171_350615458133208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is electric outlet (annotated by the red box) located in relation to chair in the image? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018817_20109038874083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the cardboard box (highlighted by a red box)? Choose among these: washing machine (highlighted by a blue box) or bath towel (highlighted by a green box).\n(A) washing machine\n(B) bath towel" }, { "from": "gpt", "value": "(B) bath towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898384_367784797477875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, curtain (highlighted by a red box) or book (highlighted by a blue box)?\n(A) curtain\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332152_259948028136500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, computer monitor (highlighted by a red box) or desk (highlighted by a blue box)?\n(A) computer monitor\n(B) desk" }, { "from": "gpt", "value": "(B) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261381_26858106259000_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from window (highlighted by a red box)? Choose from bottle (highlighted by a blue box) and remote control (highlighted by a green box).\n(A) bottle\n(B) remote control" }, { "from": "gpt", "value": "(B) remote control" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47431092_76036855078125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, door (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) door\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018059_718934726180625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, bathroom cabinet (highlighted by a red box) or comic book character (highlighted by a blue box)?\n(A) bathroom cabinet\n(B) comic book character" }, { "from": "gpt", "value": "(A) bathroom cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333670_133947369067666_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from cabinetry (highlighted by a red box)? Choose from clothing (highlighted by a blue box) and furniture (highlighted by a green box).\n(A) clothing\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895192_38399227378291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to toilet paper (highlighted by a red box)? beach towel (highlighted by a blue box) or carton (highlighted by a green box).\n(A) beach towel\n(B) carton" }, { "from": "gpt", "value": "(B) carton" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896351_18766902212416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of studio couch (annotated by the red box) and bean bag chair in the image provided, where is studio couch (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018846_649927709256458_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the electric outlet (highlighted by a red box)? Choose among these: curtain (highlighted by a blue box) or bottle (highlighted by a green box).\n(A) curtain\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334027_273664508384958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from cardboard box (highlighted by a red box)? Choose from table (highlighted by a blue box) and cardboard box (highlighted by a green box).\n(A) table\n(B) cardboard box" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898212_145952382099625_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from armchair (highlighted by a red box)? Select from chair (highlighted by a blue box) and armchair (highlighted by a green box).\n(A) chair\n(B) armchair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204305_15147270604791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, picture frame (highlighted by a red box) or cupboard (highlighted by a blue box)?\n(A) picture frame\n(B) cupboard" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261339_23963546090458_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from kitchen appliance (highlighted by a red box), kitchen appliance (highlighted by a blue box) or bar stool (highlighted by a green box)?\n(A) kitchen appliance\n(B) bar stool" }, { "from": "gpt", "value": "(A) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895895_109476120672708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from tap (highlighted by a red box), screen door (highlighted by a blue box) or sink (highlighted by a green box)?\n(A) screen door\n(B) sink" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331273_12963048694208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, table (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) table\n(B) toy" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898729_583552569055500_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358647_2939843052125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from window (highlighted by a red box)? Choose from cabinetry (highlighted by a blue box) and appliance (highlighted by a green box).\n(A) cabinetry\n(B) appliance" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444767_81450876772041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, mattress (highlighted by a red box) or bedside lamp (highlighted by a blue box)?\n(A) mattress\n(B) bedside lamp" }, { "from": "gpt", "value": "(A) mattress" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895633_471787504778291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from television (highlighted by a red box)? book (highlighted by a blue box) or bookcase (highlighted by a green box)?\n(A) book\n(B) bookcase" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018889_654984087549250_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331040_479756922190791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the chair (highlighted by a red box)? bar stool (highlighted by a blue box) or table (highlighted by a green box).\n(A) bar stool\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796216_1954229259750_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from toilet paper (highlighted by a red box)? Choose among these: curtain (highlighted by a blue box) or bathroom cabinet (highlighted by a green box).\n(A) curtain\n(B) bathroom cabinet" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444872_98060177651291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, toy (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670195_53378599956541_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, studio couch (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333674_134161365502666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, furniture (highlighted by a red box) or blanket (highlighted by a blue box)?\n(A) furniture\n(B) blanket" }, { "from": "gpt", "value": "(B) blanket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331922_630793795628708_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670271_66592417447165_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, door (highlighted by a red box) or doormat (highlighted by a blue box)?\n(A) door\n(B) doormat" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897434_104185217788666_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, picture frame (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) picture frame\n(B) radiator" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446131_141096365599458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, furniture (highlighted by a red box) or computer monitor (highlighted by a blue box)?\n(A) furniture\n(B) computer monitor" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897712_112019291849916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, tray (highlighted by a red box) or food (highlighted by a blue box)?\n(A) tray\n(B) food" }, { "from": "gpt", "value": "(A) tray" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115362_816070058166_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to pillow (highlighted by a red box)? Select from cat bed (highlighted by a blue box) and tripod (highlighted by a green box).\n(A) cat bed\n(B) tripod" }, { "from": "gpt", "value": "(B) tripod" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669917_14112260701750_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from picture frame (highlighted by a red box), picture frame (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899285_885249567727375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, door (highlighted by a red box) or corridor (highlighted by a blue box)?\n(A) door\n(B) corridor" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897712_112125297557250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, waste container (highlighted by a red box) or ceramic tile (highlighted by a blue box)?\n(A) waste container\n(B) ceramic tile" }, { "from": "gpt", "value": "(B) ceramic tile" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334627_386299845384333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of vanity (annotated by the red box) and toilet paper in the image provided, where is vanity (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018307_109090177704458_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, chair (highlighted by a red box) or swivel chair (highlighted by a blue box)?\n(A) chair\n(B) swivel chair" }, { "from": "gpt", "value": "(B) swivel chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261344_24293548930083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, desk (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) desk\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649743_49721894894833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from computer keyboard (highlighted by a red box)? computer monitor (highlighted by a blue box) or computer monitor (highlighted by a green box)?\n(A) computer monitor\n(B) computer monitor" }, { "from": "gpt", "value": "(B) computer monitor" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204622_11889745768416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, drawer (highlighted by a red box) or table (highlighted by a blue box)?\n(A) drawer\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445691_57463381898708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, box (highlighted by a red box) or footwear (highlighted by a blue box)?\n(A) box\n(B) footwear" }, { "from": "gpt", "value": "(A) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358386_19244743937875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, table (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018785_18220439033541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from window screen (highlighted by a red box)? Choose from screen door (highlighted by a blue box) and window sill (highlighted by a green box).\n(A) screen door\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897948_351343917065625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from radiator (highlighted by a red box)? Choose from studio couch (highlighted by a blue box) and furniture (highlighted by a green box).\n(A) studio couch\n(B) furniture" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898261_696948224876291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, book (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) book\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445613_56635809068833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, table (highlighted by a red box) or cardboard box (highlighted by a blue box)?\n(A) table\n(B) cardboard box" }, { "from": "gpt", "value": "(B) cardboard box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115445_11769537267875_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from picture frame (highlighted by a red box)? picture frame (highlighted by a blue box) or mattress (highlighted by a green box)?\n(A) picture frame\n(B) mattress" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896404_16747324087458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, toaster (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) toaster\n(B) electric outlet" }, { "from": "gpt", "value": "(A) toaster" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670291_62232214309791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to studio couch (highlighted by a red box), light fixture (highlighted by a blue box) or lamp (highlighted by a green box)?\n(A) light fixture\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896378_20352538692125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, door (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) door\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261562_75476976651333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, doormat (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) doormat\n(B) toy" }, { "from": "gpt", "value": "(A) doormat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115143_87050487082833_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the magazine (highlighted by a red box)? magazine (highlighted by a blue box) or magazine (highlighted by a green box).\n(A) magazine\n(B) magazine" }, { "from": "gpt", "value": "(B) magazine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261645_633111373125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, swivel chair (highlighted by a red box) or fireplace (highlighted by a blue box)?\n(A) swivel chair\n(B) fireplace" }, { "from": "gpt", "value": "(B) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445692_63118675574958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to pillow (highlighted by a red box)? Select from chest of drawers (highlighted by a blue box) and nightstand (highlighted by a green box).\n(A) chest of drawers\n(B) nightstand" }, { "from": "gpt", "value": "(B) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897822_132898286271041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895448_129487093084166_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458330_102957716836916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333110_108806393166583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, tap (highlighted by a red box) or soap dispenser (highlighted by a blue box)?\n(A) tap\n(B) soap dispenser" }, { "from": "gpt", "value": "(B) soap dispenser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896010_137008562056000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, curtain (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) curtain\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898449_3251382092750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, toiletry (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) toiletry\n(B) toiletry" }, { "from": "gpt", "value": "(A) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897849_529455472366541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from tableware (highlighted by a red box)? Choose among these: countertop (highlighted by a blue box) or tableware (highlighted by a green box).\n(A) countertop\n(B) tableware" }, { "from": "gpt", "value": "(A) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897434_104263318549375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, chair (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) chair\n(B) basket" }, { "from": "gpt", "value": "(B) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897954_533751622759541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, cleaning product (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) cleaning product\n(B) toiletry" }, { "from": "gpt", "value": "(B) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662959_24603496945500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, faucet (highlighted by a red box) or bath towel (highlighted by a blue box)?\n(A) faucet\n(B) bath towel" }, { "from": "gpt", "value": "(B) bath towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430217_180347210961416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, computer monitor (highlighted by a red box) or computer tower (highlighted by a blue box)?\n(A) computer monitor\n(B) computer tower" }, { "from": "gpt", "value": "(B) computer tower" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204481_24838567806833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, box (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) box\n(B) cabinetry" }, { "from": "gpt", "value": "(A) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445206_10671921822500_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458607_125647599880583_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of shaving cream (annotated by the red box) in relation to sink? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204377_18070231464458_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, swivel chair (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) swivel chair\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899899_1026853431970541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, table lamp (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) table lamp\n(B) toy" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895956_133513158633000_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from bottle (highlighted by a red box), bottle (highlighted by a blue box) or bottle (highlighted by a green box)?\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898696_580833692487833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, cabinetry (highlighted by a red box) or exhaust hood (highlighted by a blue box)?\n(A) cabinetry\n(B) exhaust hood" }, { "from": "gpt", "value": "(B) exhaust hood" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334267_156780267537958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to plain (highlighted by a red box)? Select from television (highlighted by a blue box) and houseplant (highlighted by a green box).\n(A) television\n(B) houseplant" }, { "from": "gpt", "value": "(A) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332585_360735948725791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, shelf (highlighted by a red box) or storage box (highlighted by a blue box)?\n(A) shelf\n(B) storage box" }, { "from": "gpt", "value": "(B) storage box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261099_1008854285500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chest of drawers (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) chest of drawers\n(B) appliance" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261390_27751270329583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the curtain (highlighted by a red box)? Choose among these: pillow (highlighted by a blue box) or coffee table (highlighted by a green box).\n(A) pillow\n(B) coffee table" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739969_18632382131125_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from vase (highlighted by a red box)? Choose from writing (highlighted by a blue box) and flower (highlighted by a green box).\n(A) writing\n(B) flower" }, { "from": "gpt", "value": "(B) flower" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331711_11317719630291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of air conditioning (annotated by the red box) in relation to cupboard? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115358_4169806373708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, curtain (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) curtain\n(B) picture frame" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896310_6779741377500_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796443_799418725541_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, nightstand (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) nightstand\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333803_51472546353833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898261_697072523572083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from power outlet (highlighted by a red box)? Select from glass jar (highlighted by a blue box) and power outlet (highlighted by a green box).\n(A) glass jar\n(B) power outlet" }, { "from": "gpt", "value": "(A) glass jar" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899909_1027571772906708_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the pillow (highlighted by a red box)? furniture (highlighted by a blue box) or table (highlighted by a green box).\n(A) furniture\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331239_284185230784875_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430924_93010273900708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the studio couch (highlighted by a red box)? Choose among these: furniture (highlighted by a blue box) or shelf (highlighted by a green box).\n(A) furniture\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669925_14061264246166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, picture frame (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) picture frame\n(B) shelf" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739678_749806337333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, furniture (highlighted by a red box) or window (highlighted by a blue box)?\n(A) furniture\n(B) window" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115624_3615100928708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, door (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) door\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896074_132742315110458_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of blanket (annotated by the red box) in reference to waste container? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649603_35981599579166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, desk (highlighted by a red box) or pad (highlighted by a blue box)?\n(A) desk\n(B) pad" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334464_100949297838625_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from coffee table (highlighted by a red box)? curtain (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) curtain\n(B) chair" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429886_367892632757708_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from window (highlighted by a red box)? curtain (highlighted by a blue box) or curtain (highlighted by a green box)?\n(A) curtain\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828150_73448099237791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, furniture (highlighted by a red box) or step stool (highlighted by a blue box)?\n(A) furniture\n(B) step stool" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796473_4060625700250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, nightstand (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) nightstand\n(B) pillow" }, { "from": "gpt", "value": "(A) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897462_470238067147500_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from bar stool (highlighted by a red box)? Select from table (highlighted by a blue box) and stool (highlighted by a green box).\n(A) table\n(B) stool" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430439_1024147424833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, gas stove (highlighted by a red box) or food (highlighted by a blue box)?\n(A) gas stove\n(B) food" }, { "from": "gpt", "value": "(A) gas stove" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446025_134661302693875_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from book (highlighted by a red box)? Choose from book (highlighted by a blue box) and book (highlighted by a green box).\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204761_26610202521166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, clock (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) clock\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332401_406041359024125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, lamp (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) lamp\n(B) lamp" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663363_91250698437583_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from houseplant (highlighted by a red box), picture frame (highlighted by a blue box) or glass door (highlighted by a green box)?\n(A) picture frame\n(B) glass door" }, { "from": "gpt", "value": "(B) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445173_8131924253083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is rope (annotated by the red box) located relative to door?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897870_529970961484500_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from toy (highlighted by a red box)? Choose from appliance (highlighted by a blue box) and toy (highlighted by a green box).\n(A) appliance\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446068_80623268290541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from toilet paper (highlighted by a red box)? Choose from path (highlighted by a blue box) and bath mat (highlighted by a green box).\n(A) path\n(B) bath mat" }, { "from": "gpt", "value": "(B) bath mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446466_355408459770666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from plain (highlighted by a red box)? Select from table (highlighted by a blue box) and animal (highlighted by a green box).\n(A) table\n(B) animal" }, { "from": "gpt", "value": "(B) animal" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663317_76512775578541_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, sink (highlighted by a red box) or plant (highlighted by a blue box)?\n(A) sink\n(B) plant" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332986_124526875157750_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649614_37054060599333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, shopping cart (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) shopping cart\n(B) toilet paper" }, { "from": "gpt", "value": "(A) shopping cart" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899271_883789099211375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, sink (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) sink\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331217_281124343564500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, window sill (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) window sill\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204275_12642464932375_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018125_369116744300625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is glass door (annotated by the red box) located relative to door?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897875_342212306348583_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649408_10086392668625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to book (highlighted by a red box)? Select from shelf (highlighted by a blue box) and window screen (highlighted by a green box).\n(A) shelf\n(B) window screen" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669917_14142265495375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, picture frame (highlighted by a red box) or file cabinet (highlighted by a blue box)?\n(A) picture frame\n(B) file cabinet" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663322_77643667649833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, table (highlighted by a red box) or window screen (highlighted by a blue box)?\n(A) table\n(B) window screen" }, { "from": "gpt", "value": "(B) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204505_864763577166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, appliance (highlighted by a red box) or table (highlighted by a blue box)?\n(A) appliance\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204763_26753609521125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of door (annotated by the red box) and door in the image provided, where is door (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649598_35850903758333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the bowl (highlighted by a red box)? Choose among these: chair (highlighted by a blue box) or chair (highlighted by a green box).\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895868_107586767113291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, lamp (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) lamp\n(B) picture frame" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649772_43480714178666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to studio couch (highlighted by a red box)? Select from window (highlighted by a blue box) and curtain (highlighted by a green box).\n(A) window\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334267_156790280104916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, picture frame (highlighted by a red box) or round table (highlighted by a blue box)?\n(A) picture frame\n(B) round table" }, { "from": "gpt", "value": "(B) round table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334039_278827108707166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, houseplant (highlighted by a red box) or flowerpot (highlighted by a blue box)?\n(A) houseplant\n(B) flowerpot" }, { "from": "gpt", "value": "(B) flowerpot" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204591_500218030083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, cabinetry (highlighted by a red box) or glass door (highlighted by a blue box)?\n(A) cabinetry\n(B) glass door" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334079_88667185464875_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to toiletry (highlighted by a red box)? mirror (highlighted by a blue box) or toothpaste (highlighted by a green box).\n(A) mirror\n(B) toothpaste" }, { "from": "gpt", "value": "(B) toothpaste" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897631_139557555191416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, door (highlighted by a red box) or door (highlighted by a blue box)?\n(A) door\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897955_216376021006083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to studio couch (highlighted by a red box)? Select from studio couch (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430439_1084456350250_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to apple (highlighted by a red box)? Choose from glass jar (highlighted by a blue box) and countertop (highlighted by a green box).\n(A) glass jar\n(B) countertop" }, { "from": "gpt", "value": "(A) glass jar" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331432_546041209991332_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is infant bed (annotated by the red box) located relative to toy? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334040_278958921735166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, kitchen appliance (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) kitchen appliance\n(B) appliance" }, { "from": "gpt", "value": "(A) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331103_135754873162416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, appliance (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444907_106176054612000_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896009_137244263755500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from bay window (highlighted by a red box)? Choose from window (highlighted by a blue box) and lighting (highlighted by a green box).\n(A) window\n(B) lighting" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458364_100680442485666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from pillow (highlighted by a red box)? Select from bed (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) bed\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333265_21692107388791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, bottle (highlighted by a red box) or plastic bag (highlighted by a blue box)?\n(A) bottle\n(B) plastic bag" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261686_3803947208375_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to starfish (highlighted by a red box)? fireplace (highlighted by a blue box) or fireplace (highlighted by a green box).\n(A) fireplace\n(B) fireplace" }, { "from": "gpt", "value": "(B) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261241_15102005546000_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to sleeping bag (highlighted by a red box), bookcase (highlighted by a blue box) or paperback book (highlighted by a green box)?\n(A) bookcase\n(B) paperback book" }, { "from": "gpt", "value": "(A) bookcase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898558_182002779539250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, swivel chair (highlighted by a red box) or computer monitor (highlighted by a blue box)?\n(A) swivel chair\n(B) computer monitor" }, { "from": "gpt", "value": "(B) computer monitor" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669937_14927490403208_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to bunk bed (highlighted by a red box)? Select from machine (highlighted by a blue box) and toy (highlighted by a green box).\n(A) machine\n(B) toy" }, { "from": "gpt", "value": "(A) machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333581_207688029113041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, rocking chair (highlighted by a red box) or table (highlighted by a blue box)?\n(A) rocking chair\n(B) table" }, { "from": "gpt", "value": "(A) rocking chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898477_157294718402458_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from pillow (highlighted by a red box)? Choose among these: table (highlighted by a blue box) or mat (highlighted by a green box).\n(A) table\n(B) mat" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896587_32935239232000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhere is door (annotated by the red box) located in relation to bundle in the image?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358472_46616371516666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, desk (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) desk\n(B) pillow" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663313_76568269276166_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from swivel chair (highlighted by a red box), cabinetry (highlighted by a blue box) or radiator (highlighted by a green box)?\n(A) cabinetry\n(B) radiator" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899198_186493787833791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from radiator (highlighted by a red box)? Choose from wall clock (highlighted by a blue box) and table (highlighted by a green box).\n(A) wall clock\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331276_12775741688166_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from plywood (highlighted by a red box)? dish washer (highlighted by a blue box) or furniture (highlighted by a green box)?\n(A) dish washer\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739276_42841471151791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the book (highlighted by a red box)? cabinetry (highlighted by a blue box) or shelf (highlighted by a green box).\n(A) cabinetry\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334754_421207712026166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from bay window (highlighted by a red box)? air conditioner (highlighted by a blue box) or houseplant (highlighted by a green box)?\n(A) air conditioner\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898039_222115325272541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from ceramic tile (highlighted by a red box)? Choose from chest of drawers (highlighted by a blue box) and screen door (highlighted by a green box).\n(A) chest of drawers\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333847_74924629483541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from pillow (highlighted by a red box), flower (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) flower\n(B) pillow" }, { "from": "gpt", "value": "(A) flower" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261527_45664745394208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48017887_80080909579000_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the clothing (highlighted by a red box)? swivel chair (highlighted by a blue box) or closet (highlighted by a green box).\n(A) swivel chair\n(B) closet" }, { "from": "gpt", "value": "(B) closet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261167_1338258053625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the shelf (highlighted by a red box)? shelf (highlighted by a blue box) or book (highlighted by a green box).\n(A) shelf\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018156_373297073098208_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to cabinetry (highlighted by a red box), shelf (highlighted by a blue box) or shelf (highlighted by a green box)?\n(A) shelf\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739479_52519122365833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from basket (highlighted by a red box), cabinet (highlighted by a blue box) or door (highlighted by a green box)?\n(A) cabinet\n(B) door" }, { "from": "gpt", "value": "(A) cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899936_863319473155333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from pillow (highlighted by a red box), furniture (highlighted by a blue box) or furniture (highlighted by a green box)?\n(A) furniture\n(B) furniture" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895196_39125419584958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from tableware (highlighted by a red box), desk (highlighted by a blue box) or houseplant (highlighted by a green box)?\n(A) desk\n(B) houseplant" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260889_8601502391791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from toiletry (highlighted by a red box)? bottle (highlighted by a blue box) or bottle (highlighted by a green box)?\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333666_131967097744166_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from toy (highlighted by a red box)? Select from toy (highlighted by a blue box) and toy (highlighted by a green box).\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332316_390854663653750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, cabinetry (highlighted by a red box) or towel/napkin (highlighted by a blue box)?\n(A) cabinetry\n(B) towel/napkin" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333308_28103343763583_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, curtain (highlighted by a red box) or vanity (highlighted by a blue box)?\n(A) curtain\n(B) vanity" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446450_354751022005000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, shelf (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) shelf\n(B) bottle" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669934_14860183690916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, cleaning product (highlighted by a red box) or folding chair (highlighted by a blue box)?\n(A) cleaning product\n(B) folding chair" }, { "from": "gpt", "value": "(A) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649408_10116397469333_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from door (highlighted by a red box)? ladder (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) ladder\n(B) chair" }, { "from": "gpt", "value": "(A) ladder" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332467_886366776861416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, appliance (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) appliance\n(B) mat" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429738_19830075180041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from curtain (highlighted by a red box)? Select from mattress (highlighted by a blue box) and curtain (highlighted by a green box).\n(A) mattress\n(B) curtain" }, { "from": "gpt", "value": "(A) mattress" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669880_11262306994250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, bar stool (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) bar stool\n(B) pillow" }, { "from": "gpt", "value": "(A) bar stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334609_385048660261833_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115137_85877831620750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, light bulb (highlighted by a red box) or shower (highlighted by a blue box)?\n(A) light bulb\n(B) shower" }, { "from": "gpt", "value": "(B) shower" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828554_101403018667791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, stove (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) stove\n(B) appliance" }, { "from": "gpt", "value": "(A) stove" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334540_66359381639083_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears farthest from the camera in this image?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334624_385764523487666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, table (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) table\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429721_18009343452500_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, bowl (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) bowl\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331143_177732640722583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, mouthwash (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) mouthwash\n(B) toilet paper" }, { "from": "gpt", "value": "(A) mouthwash" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796562_15954475119250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, picture frame (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) picture frame\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261314_22239938607625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from window (highlighted by a red box), curtain (highlighted by a blue box) or curtain (highlighted by a green box)?\n(A) curtain\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898256_696568930935958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, computer desk (highlighted by a red box) or laptop keyboard (highlighted by a blue box)?\n(A) computer desk\n(B) laptop keyboard" }, { "from": "gpt", "value": "(B) laptop keyboard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334672_391408104700166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, elevator (highlighted by a red box) or cupboard (highlighted by a blue box)?\n(A) elevator\n(B) cupboard" }, { "from": "gpt", "value": "(A) elevator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261313_22343845554958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to curtain (highlighted by a red box), table (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) table\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796279_912860688958_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to toilet paper (highlighted by a red box)? Select from cleaning product (highlighted by a blue box) and toilet (highlighted by a green box).\n(A) cleaning product\n(B) toilet" }, { "from": "gpt", "value": "(A) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796721_27379886489208_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to table (highlighted by a red box)? Select from window screen (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) window screen\n(B) cabinetry" }, { "from": "gpt", "value": "(A) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897462_470074068530250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, picture frame (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) picture frame\n(B) studio couch" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333268_22000315396875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, yoghurt (highlighted by a red box) or food (highlighted by a blue box)?\n(A) yoghurt\n(B) food" }, { "from": "gpt", "value": "(A) yoghurt" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334728_535773033166207_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, chair (highlighted by a red box) or floral arrangement (highlighted by a blue box)?\n(A) chair\n(B) floral arrangement" }, { "from": "gpt", "value": "(B) floral arrangement" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898021_220961126561166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, curtain (highlighted by a red box) or window (highlighted by a blue box)?\n(A) curtain\n(B) window" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899970_654468751416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from person (highlighted by a red box)? Choose among these: studio couch (highlighted by a blue box) or window (highlighted by a green box).\n(A) studio couch\n(B) window" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897712_112041299337083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, table (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) table\n(B) appliance" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334070_87054415765208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, bath mat (highlighted by a red box) or glass box (highlighted by a blue box)?\n(A) bath mat\n(B) glass box" }, { "from": "gpt", "value": "(A) bath mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896066_131832986234375_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to appliance (highlighted by a red box), appliance (highlighted by a blue box) or shelf (highlighted by a green box)?\n(A) appliance\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358162_61044729886458_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from door (highlighted by a red box)? door (highlighted by a blue box) or door (highlighted by a green box)?\n(A) door\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333862_75556735489708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, tap (highlighted by a red box) or toilet (highlighted by a blue box)?\n(A) tap\n(B) toilet" }, { "from": "gpt", "value": "(B) toilet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48017884_79982799333375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, window sill (highlighted by a red box) or closet (highlighted by a blue box)?\n(A) window sill\n(B) closet" }, { "from": "gpt", "value": "(A) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430937_94960538605583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, mouthwash (highlighted by a red box) or faucet (highlighted by a blue box)?\n(A) mouthwash\n(B) faucet" }, { "from": "gpt", "value": "(B) faucet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333281_25688527909791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is basket container (annotated by the red box) located relative to chest of drawers?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331813_228706946610625_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331298_14991938422333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from cabinet (highlighted by a red box)? glass jar (highlighted by a blue box) or shot glass (highlighted by a green box)?\n(A) glass jar\n(B) shot glass" }, { "from": "gpt", "value": "(B) shot glass" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332759_43354227610375_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the bidet (highlighted by a red box)? Choose among these: toilet (highlighted by a blue box) or bath (highlighted by a green box).\n(A) toilet\n(B) bath" }, { "from": "gpt", "value": "(A) toilet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670028_32310502974958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the appliance (highlighted by a red box)? plant (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) plant\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358340_15275320809000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, counter top (highlighted by a red box) or tap (highlighted by a blue box)?\n(A) counter top\n(B) tap" }, { "from": "gpt", "value": "(A) counter top" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895491_450900054568166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from pillow (highlighted by a red box), toy (highlighted by a blue box) or toy (highlighted by a green box)?\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896020_138384684306999_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, cabinetry (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) cabinetry\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018069_98100654224500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, toiletry (highlighted by a red box) or mirror (highlighted by a blue box)?\n(A) toiletry\n(B) mirror" }, { "from": "gpt", "value": "(B) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896083_144021894174208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, pillow (highlighted by a red box) or window screen (highlighted by a blue box)?\n(A) pillow\n(B) window screen" }, { "from": "gpt", "value": "(B) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430442_752457235750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, beer (highlighted by a red box) or beverage (highlighted by a blue box)?\n(A) beer\n(B) beverage" }, { "from": "gpt", "value": "(B) beverage" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333673_134115767380415_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, curtain (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) curtain\n(B) screen door" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332489_341252589236875_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from bath towel (highlighted by a red box)? cleaning product (highlighted by a blue box) or tap (highlighted by a green box)?\n(A) cleaning product\n(B) tap" }, { "from": "gpt", "value": "(A) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828245_81749389625625_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to cabinetry (highlighted by a red box)? Choose from curtain (highlighted by a blue box) and curtain (highlighted by a green box).\n(A) curtain\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446462_354228435633791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, desk (highlighted by a red box) or doormat (highlighted by a blue box)?\n(A) desk\n(B) doormat" }, { "from": "gpt", "value": "(B) doormat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896379_20394437954541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, table lamp (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) table lamp\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333847_74947820091666_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to table (highlighted by a red box)? Select from round table (highlighted by a blue box) and ipad (highlighted by a green box).\n(A) round table\n(B) ipad" }, { "from": "gpt", "value": "(A) round table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332833_32825913882166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, storage box (highlighted by a red box) or jacket (highlighted by a blue box)?\n(A) storage box\n(B) jacket" }, { "from": "gpt", "value": "(B) jacket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261228_13628719992541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, door (highlighted by a red box) or plain (highlighted by a blue box)?\n(A) door\n(B) plain" }, { "from": "gpt", "value": "(B) plain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828270_84279287986541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from appliance (highlighted by a red box)? Choose among these: appliance (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331347_192474519629333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, shelf (highlighted by a red box) or table (highlighted by a blue box)?\n(A) shelf\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334037_278530612453125_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to laundry (highlighted by a red box), cabinetry (highlighted by a blue box) or lamp (highlighted by a green box)?\n(A) cabinetry\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897462_469893459838166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, picture frame (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) picture frame\n(B) furniture" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899448_189694534488750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, door (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) door\n(B) curtain" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670291_62294223105083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the glass door (highlighted by a red box)? Choose among these: picture frame (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663053_38553390989125_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the chair (highlighted by a red box)? Choose among these: houseplant (highlighted by a blue box) or faucet (highlighted by a green box).\n(A) houseplant\n(B) faucet" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445612_56474009403375_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to box (highlighted by a red box)? Select from chair (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) chair\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895611_470201403349833_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to cabinetry (highlighted by a red box)? Choose from sink (highlighted by a blue box) and appliance (highlighted by a green box).\n(A) sink\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018552_830377427615625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from plywood (highlighted by a red box)? electric outlet (highlighted by a blue box) or electric outlet (highlighted by a green box)?\n(A) electric outlet\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898242_695992806819875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, helmet (highlighted by a red box) or blanket (highlighted by a blue box)?\n(A) helmet\n(B) blanket" }, { "from": "gpt", "value": "(A) helmet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663415_95846675829708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, concrete (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) concrete\n(B) houseplant" }, { "from": "gpt", "value": "(A) concrete" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898560_183760603598666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the curtain (highlighted by a red box)? Choose among these: picture frame (highlighted by a blue box) or mirror (highlighted by a green box).\n(A) picture frame\n(B) mirror" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261248_15190802060041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, chair (highlighted by a red box) or backpack (highlighted by a blue box)?\n(A) chair\n(B) backpack" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261294_16256835105791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to bed (highlighted by a red box)? Select from screen door (highlighted by a blue box) and material (highlighted by a green box).\n(A) screen door\n(B) material" }, { "from": "gpt", "value": "(B) material" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260938_4952185971625_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from curtain (highlighted by a red box)? cabinetry (highlighted by a blue box) or furniture (highlighted by a green box)?\n(A) cabinetry\n(B) furniture" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333826_53526857599625_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to washing machine (highlighted by a red box)? Select from bottle (highlighted by a blue box) and waste (highlighted by a green box).\n(A) bottle\n(B) waste" }, { "from": "gpt", "value": "(B) waste" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334273_157183269515000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, picture frame (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) picture frame\n(B) shelf" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444904_106271465619625_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331627_20086042229541_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, refrigerator (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) refrigerator\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331103_135738879653457_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from appliance (highlighted by a red box), bottle (highlighted by a blue box) or appliance (highlighted by a green box)?\n(A) bottle\n(B) appliance" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445206_10663925009250_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from table lamp (highlighted by a red box)? Choose from furniture (highlighted by a blue box) and fireplace (highlighted by a green box).\n(A) furniture\n(B) fireplace" }, { "from": "gpt", "value": "(B) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333275_24864495708750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, studio couch (highlighted by a red box) or bookshelf (highlighted by a blue box)?\n(A) studio couch\n(B) bookshelf" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897722_114308640915041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, door (highlighted by a red box) or picnic basket (highlighted by a blue box)?\n(A) door\n(B) picnic basket" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333475_58597731164916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of table (annotated by the red box) and pillow in the image provided, where is table (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358168_61132028707208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, curtain (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) curtain\n(B) curtain" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430795_60946063333125_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898625_757762503315958_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, counter top (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) counter top\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670179_43173761344791_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to toiletry (highlighted by a red box)? toiletry (highlighted by a blue box) or toiletry (highlighted by a green box).\n(A) toiletry\n(B) toiletry" }, { "from": "gpt", "value": "(A) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896396_22564364511291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, mattress (highlighted by a red box) or animal (highlighted by a blue box)?\n(A) mattress\n(B) animal" }, { "from": "gpt", "value": "(A) mattress" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895633_471732094013083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to screen door (highlighted by a red box), window (highlighted by a blue box) or curtain (highlighted by a green box)?\n(A) window\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018549_830148020911750_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from nightstand (highlighted by a red box)? pillow (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332396_401328814636041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, cabinetry (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) cabinetry\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445198_10941014911166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, studio couch (highlighted by a red box) or throw pillow (highlighted by a blue box)?\n(A) studio couch\n(B) throw pillow" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334616_385496932612000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from chair (highlighted by a red box)? computer monitor (highlighted by a blue box) or speaker (highlighted by a green box)?\n(A) computer monitor\n(B) speaker" }, { "from": "gpt", "value": "(B) speaker" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445697_62707096447125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, swivel chair (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) swivel chair\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898899_816922737753541_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from material (highlighted by a red box)? chest of drawers (highlighted by a blue box) or countertop (highlighted by a green box)?\n(A) chest of drawers\n(B) countertop" }, { "from": "gpt", "value": "(B) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018106_368089719083666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, shelf (highlighted by a red box) or table (highlighted by a blue box)?\n(A) shelf\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458260_74333049330375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, tripod (highlighted by a red box) or closet (highlighted by a blue box)?\n(A) tripod\n(B) closet" }, { "from": "gpt", "value": "(A) tripod" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444875_99406250489750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of electric outlet (annotated by the red box) and furniture in the image provided, where is electric outlet (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115338_2289263475416_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from door (highlighted by a red box)? Choose from chest of drawers (highlighted by a blue box) and door (highlighted by a green box).\n(A) chest of drawers\n(B) door" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897973_216851859935583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, countertop (highlighted by a red box) or wall clock (highlighted by a blue box)?\n(A) countertop\n(B) wall clock" }, { "from": "gpt", "value": "(A) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649464_13823136126541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, chair (highlighted by a red box) or table (highlighted by a blue box)?\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334760_421805540438583_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899664_234679770276250_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from clock (highlighted by a red box)? Choose from window (highlighted by a blue box) and screen door (highlighted by a green box).\n(A) window\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430539_300337724160625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, animal (highlighted by a red box) or side cabinet (highlighted by a blue box)?\n(A) animal\n(B) side cabinet" }, { "from": "gpt", "value": "(A) animal" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828369_92421021633041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the picture frame (highlighted by a red box)? picture frame (highlighted by a blue box) or screen door (highlighted by a green box).\n(A) picture frame\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018608_633254505480041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, appliance (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332016_200804139998291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from light fixture (highlighted by a red box)? Choose from glass door (highlighted by a blue box) and shower curtain (highlighted by a green box).\n(A) glass door\n(B) shower curtain" }, { "from": "gpt", "value": "(B) shower curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334966_669396788837541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, furniture (highlighted by a red box) or door (highlighted by a blue box)?\n(A) furniture\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444787_50433105476791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to window sill (highlighted by a red box), radiator (highlighted by a blue box) or curtain (highlighted by a green box)?\n(A) radiator\n(B) curtain" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446479_355578756985708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from furniture (highlighted by a red box)? Select from chair (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) chair\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261562_75474977478500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, washing machine (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) washing machine\n(B) screen door" }, { "from": "gpt", "value": "(A) washing machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358225_9595350188250_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to magazine (highlighted by a red box)? mat (highlighted by a blue box) or paperback book (highlighted by a green box).\n(A) mat\n(B) paperback book" }, { "from": "gpt", "value": "(B) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358660_1003187811916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, sink (highlighted by a red box) or glass door (highlighted by a blue box)?\n(A) sink\n(B) glass door" }, { "from": "gpt", "value": "(B) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48017890_80982643455458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, appliance (highlighted by a red box) or ceramic tile (highlighted by a blue box)?\n(A) appliance\n(B) ceramic tile" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358661_1192995971416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, window screen (highlighted by a red box) or vase (highlighted by a blue box)?\n(A) window screen\n(B) vase" }, { "from": "gpt", "value": "(B) vase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895571_1153716442672208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796590_17466475792500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to sink (highlighted by a red box)? ceramic tile (highlighted by a blue box) or shower (highlighted by a green box).\n(A) ceramic tile\n(B) shower" }, { "from": "gpt", "value": "(A) ceramic tile" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445135_5507036094333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is lamp (annotated by the red box) located relative to chest of drawers?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739479_52521121536333_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898052_223237129478875_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from curtain (highlighted by a red box)? Select from table lamp (highlighted by a blue box) and mechanical fan (highlighted by a green box).\n(A) table lamp\n(B) mechanical fan" }, { "from": "gpt", "value": "(B) mechanical fan" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739689_1075037988708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to table lamp (highlighted by a red box)? Choose from concrete (highlighted by a blue box) and nightstand (highlighted by a green box).\n(A) concrete\n(B) nightstand" }, { "from": "gpt", "value": "(B) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018334_116209001734666_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from bottle (highlighted by a red box)? Select from chair (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) chair\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458221_76874969809958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from blanket (highlighted by a red box)? Choose from paperback book (highlighted by a blue box) and paperback book (highlighted by a green box).\n(A) paperback book\n(B) paperback book" }, { "from": "gpt", "value": "(A) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429728_19253341326750_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to chair (highlighted by a red box), computer desk (highlighted by a blue box) or toiletry (highlighted by a green box)?\n(A) computer desk\n(B) toiletry" }, { "from": "gpt", "value": "(B) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204670_12411144355250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, paperback book (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) paperback book\n(B) shelf" }, { "from": "gpt", "value": "(A) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895593_1161508176760708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, cabinetry (highlighted by a red box) or clothe (highlighted by a blue box)?\n(A) cabinetry\n(B) clothe" }, { "from": "gpt", "value": "(B) clothe" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333275_24539512560833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chest of drawers (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) chest of drawers\n(B) toy" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899664_234633771813708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, armchair (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) armchair\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358327_18941674173083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, door (highlighted by a red box) or door (highlighted by a blue box)?\n(A) door\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897467_471529824648041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, houseplant (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) houseplant\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895287_80119053116750_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to chest of drawers (highlighted by a red box), table lamp (highlighted by a blue box) or nightstand (highlighted by a green box)?\n(A) table lamp\n(B) nightstand" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458235_78477207131583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from cabinetry (highlighted by a red box)? kitchen appliance (highlighted by a blue box) or cabinetry (highlighted by a green box)?\n(A) kitchen appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(A) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018811_19334475446125_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from kitchen appliance (highlighted by a red box)? Choose from appliance (highlighted by a blue box) and chair (highlighted by a green box).\n(A) appliance\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204622_11849445834083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from curtain (highlighted by a red box), radiator (highlighted by a blue box) or table lamp (highlighted by a green box)?\n(A) radiator\n(B) table lamp" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669936_14789894859250_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to door (highlighted by a red box), door (highlighted by a blue box) or clothing (highlighted by a green box)?\n(A) door\n(B) clothing" }, { "from": "gpt", "value": "(B) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662886_16455695493873_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, picture frame (highlighted by a red box) or door (highlighted by a blue box)?\n(A) picture frame\n(B) door" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897712_112133294212125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from sink (highlighted by a red box)? Choose among these: towel bar (highlighted by a blue box) or houseplant (highlighted by a green box).\n(A) towel bar\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446048_79961955602375_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332956_22074393447750_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from picture frame (highlighted by a red box)? chair (highlighted by a blue box) or houseplant (highlighted by a green box)?\n(A) chair\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334887_622550094051958_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458260_74256346313500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, screen door (highlighted by a red box) or stool (highlighted by a blue box)?\n(A) screen door\n(B) stool" }, { "from": "gpt", "value": "(B) stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663349_91068803690833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, window screen (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) window screen\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446598_210446187103125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, orange juice (highlighted by a red box) or table (highlighted by a blue box)?\n(A) orange juice\n(B) table" }, { "from": "gpt", "value": "(A) orange juice" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261087_390856177416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, chicken (highlighted by a red box) or bath mat (highlighted by a blue box)?\n(A) chicken\n(B) bath mat" }, { "from": "gpt", "value": "(A) chicken" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333233_32341465119166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, desk (highlighted by a red box) or animal (highlighted by a blue box)?\n(A) desk\n(B) animal" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796744_28834082319125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhere is furniture (annotated by the red box) located in relation to tube in the image?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896209_2204174750083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, picture frame (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) picture frame\n(B) basket" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331518_190830170236083_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796221_2071630431622_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the tap (highlighted by a red box)? bathtub (highlighted by a blue box) or sink (highlighted by a green box).\n(A) bathtub\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670250_63499116782958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, door (highlighted by a red box) or counter top (highlighted by a blue box)?\n(A) door\n(B) counter top" }, { "from": "gpt", "value": "(B) counter top" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649397_9507066166583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to screen door (highlighted by a red box), box (highlighted by a blue box) or door (highlighted by a green box)?\n(A) box\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204291_14470092350083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the blender (highlighted by a red box)? appliance (highlighted by a blue box) or appliance (highlighted by a green box).\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334907_1086506929523208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, table (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) table\n(B) pillow" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261562_75472978305875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to washing machine (highlighted by a red box)? Choose from cabinetry (highlighted by a blue box) and door (highlighted by a green box).\n(A) cabinetry\n(B) door" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897990_219023270989541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is picture frame (annotated by the red box) located relative to door?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334222_107137215348250_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429861_13409543481083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of studio couch (annotated by the red box) in relation to doormat? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895946_109167327365458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, vase (highlighted by a red box) or soap dispenser (highlighted by a blue box)?\n(A) vase\n(B) soap dispenser" }, { "from": "gpt", "value": "(B) soap dispenser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430509_299219656004208_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458369_100715045440750_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, door (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) door\n(B) pillow" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649382_10508156725958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chest of drawers (highlighted by a red box) or drawer (highlighted by a blue box)?\n(A) chest of drawers\n(B) drawer" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204481_24856677304708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, bottle (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669880_11276301433291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from picture frame (highlighted by a red box)? chair (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333847_74953834322000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334178_350726963015875_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430068_34729393183916_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to toiletry (highlighted by a red box)? soap (highlighted by a blue box) or sink (highlighted by a green box).\n(A) soap\n(B) sink" }, { "from": "gpt", "value": "(A) soap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333812_52158562357791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, computer monitor (highlighted by a red box) or equipment (highlighted by a blue box)?\n(A) computer monitor\n(B) equipment" }, { "from": "gpt", "value": "(B) equipment" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430715_335369316388750_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to lamp (highlighted by a red box)? Choose from mat (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) mat\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204377_18044225083125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to swivel chair (highlighted by a red box)? pillow (highlighted by a blue box) or shelf (highlighted by a green box).\n(A) pillow\n(B) shelf" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444907_106168757590375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to glass plate (highlighted by a red box)? Select from pad (highlighted by a blue box) and pad (highlighted by a green box).\n(A) pad\n(B) pad" }, { "from": "gpt", "value": "(B) pad" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261326_23514278961666_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, book (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) book\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895796_680729407518916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, book (highlighted by a red box) or chest of drawers (highlighted by a blue box)?\n(A) book\n(B) chest of drawers" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334185_354546264697458_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to flower box (highlighted by a red box)? Select from flower (highlighted by a blue box) and window (highlighted by a green box).\n(A) flower\n(B) window" }, { "from": "gpt", "value": "(A) flower" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261522_45767754649875_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from pillow (highlighted by a red box)? pillow (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899318_887473497021333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from pillow (highlighted by a red box)? Select from bath (highlighted by a blue box) and bed (highlighted by a green box).\n(A) bath\n(B) bed" }, { "from": "gpt", "value": "(A) bath" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332481_338815206832166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, doll (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) doll\n(B) radiator" }, { "from": "gpt", "value": "(A) doll" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445047_1899734637583_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears farthest from the camera in this image?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334624_385770521035416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the appliance (highlighted by a red box)? swivel chair (highlighted by a blue box) or extension cord (highlighted by a green box).\n(A) swivel chair\n(B) extension cord" }, { "from": "gpt", "value": "(B) extension cord" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47431103_348310079970375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, screen door (highlighted by a red box) or cleaning product (highlighted by a blue box)?\n(A) screen door\n(B) cleaning product" }, { "from": "gpt", "value": "(B) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261219_13578807397750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, cabinetry (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) cabinetry\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669948_15416231587500_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, plant (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) plant\n(B) radiator" }, { "from": "gpt", "value": "(A) plant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115358_4305799740041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the candle holder (highlighted by a red box)? Choose among these: nightstand (highlighted by a blue box) or radiator (highlighted by a green box).\n(A) nightstand\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669851_12491846990000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, picture frame (highlighted by a red box) or elevator (highlighted by a blue box)?\n(A) picture frame\n(B) elevator" }, { "from": "gpt", "value": "(B) elevator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332564_905960634379125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, book (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) book\n(B) table lamp" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445173_8111932204625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from curtain (highlighted by a red box)? radiator (highlighted by a blue box) or desk (highlighted by a green box)?\n(A) radiator\n(B) desk" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261294_16252836686083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, toy (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) toy\n(B) chair" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331686_6600295948291_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from radiator (highlighted by a red box)? Choose from chest of drawers (highlighted by a blue box) and cardboard box (highlighted by a green box).\n(A) chest of drawers\n(B) cardboard box" }, { "from": "gpt", "value": "(B) cardboard box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898526_181071551247291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261507_43445526229041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, kitchen appliance (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) kitchen appliance\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331922_630791796432166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, pillow (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) pillow\n(B) electric outlet" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899011_640820624636250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, cabinetry (highlighted by a red box) or kitchen appliance (highlighted by a blue box)?\n(A) cabinetry\n(B) kitchen appliance" }, { "from": "gpt", "value": "(B) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261251_12653494149916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, picture frame (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) picture frame\n(B) table lamp" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896491_31468136032875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from faucet (highlighted by a red box)? Choose among these: mirror (highlighted by a blue box) or screen door (highlighted by a green box).\n(A) mirror\n(B) screen door" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663349_91070802900541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670183_43225057716833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, mouthwash (highlighted by a red box) or mouthwash (highlighted by a blue box)?\n(A) mouthwash\n(B) mouthwash" }, { "from": "gpt", "value": "(A) mouthwash" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332819_48921198995916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, material (highlighted by a red box) or concrete (highlighted by a blue box)?\n(A) material\n(B) concrete" }, { "from": "gpt", "value": "(A) material" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331495_153719007685875_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to bottle (highlighted by a red box), bottle (highlighted by a blue box) or bottle (highlighted by a green box)?\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896209_2265382486958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, radiator (highlighted by a red box) or paper (highlighted by a blue box)?\n(A) radiator\n(B) paper" }, { "from": "gpt", "value": "(B) paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115165_88147471495833_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458599_125264954280708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, screen door (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) screen door\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444907_106133955105083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to electric outlet (highlighted by a red box)? television (highlighted by a blue box) or electric outlet (highlighted by a green box).\n(A) television\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828498_101760701819583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the tile (highlighted by a red box)? Choose among these: chair (highlighted by a blue box) or step stool (highlighted by a green box).\n(A) chair\n(B) step stool" }, { "from": "gpt", "value": "(B) step stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458260_74252347893916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, computer monitor (highlighted by a red box) or crate (highlighted by a blue box)?\n(A) computer monitor\n(B) crate" }, { "from": "gpt", "value": "(A) computer monitor" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898254_696680035323458_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444708_73320669898083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, chest of drawers (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) chest of drawers\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332107_683080711182375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, houseplant (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) houseplant\n(B) houseplant" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895199_39417917010166_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204656_10843668090041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from appliance (highlighted by a red box)? Choose among these: toy (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) toy\n(B) cabinetry" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260938_4836198542875_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to doormat (highlighted by a red box)? Choose from door (highlighted by a blue box) and radiator (highlighted by a green box).\n(A) door\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739960_18554779490750_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to toy (highlighted by a red box), toy (highlighted by a blue box) or television (highlighted by a green box)?\n(A) toy\n(B) television" }, { "from": "gpt", "value": "(B) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896096_144218795878791_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from pillow (highlighted by a red box), television (highlighted by a blue box) or studio couch (highlighted by a green box)?\n(A) television\n(B) studio couch" }, { "from": "gpt", "value": "(A) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333298_26601941220500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from sink (highlighted by a red box)? tap (highlighted by a blue box) or plywood (highlighted by a green box)?\n(A) tap\n(B) plywood" }, { "from": "gpt", "value": "(A) tap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332022_202561199037166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, square (highlighted by a red box) or table (highlighted by a blue box)?\n(A) square\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895908_110740944192250_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to chair (highlighted by a red box)? Choose from chair (highlighted by a blue box) and bed (highlighted by a green box).\n(A) chair\n(B) bed" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796438_678618901083_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the radiator (highlighted by a red box)? Choose among these: cabinetry (highlighted by a blue box) or mirror (highlighted by a green box).\n(A) cabinetry\n(B) mirror" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332795_47512005285666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, power outlet (highlighted by a red box) or window (highlighted by a blue box)?\n(A) power outlet\n(B) window" }, { "from": "gpt", "value": "(A) power outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430220_180132014533875_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331604_18578706862916_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the basket (highlighted by a red box)? counter (highlighted by a blue box) or toiletry (highlighted by a green box).\n(A) counter\n(B) toiletry" }, { "from": "gpt", "value": "(A) counter" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333636_123848996292708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, kitchen appliance (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) kitchen appliance\n(B) bottle" }, { "from": "gpt", "value": "(A) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895480_134475621171125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, box (highlighted by a red box) or handbag (highlighted by a blue box)?\n(A) box\n(B) handbag" }, { "from": "gpt", "value": "(B) handbag" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018846_649968409319500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, tablecloth (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) tablecloth\n(B) chair" }, { "from": "gpt", "value": "(A) tablecloth" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430928_92937570209916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, television (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) television\n(B) cabinetry" }, { "from": "gpt", "value": "(A) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358660_1007186230291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from countertop (highlighted by a red box)? counter (highlighted by a blue box) or cabinetry (highlighted by a green box)?\n(A) counter\n(B) cabinetry" }, { "from": "gpt", "value": "(A) counter" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895591_1161460579367625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the door (highlighted by a red box)? screen door (highlighted by a blue box) or tile (highlighted by a green box).\n(A) screen door\n(B) tile" }, { "from": "gpt", "value": "(B) tile" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261355_25781233758375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, bottle (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) bottle\n(B) appliance" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204481_24814577300458_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to glass door (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and radiator (highlighted by a green box).\n(A) picture frame\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669851_12537861265083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chair (highlighted by a red box) or kitchen & dining room table (highlighted by a blue box)?\n(A) chair\n(B) kitchen & dining room table" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670293_62030910572041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, lighting (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) lighting\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458452_118114131813833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, lamp (highlighted by a red box) or window (highlighted by a blue box)?\n(A) lamp\n(B) window" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897849_529443460605458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, curtain (highlighted by a red box) or floral arrangement (highlighted by a blue box)?\n(A) curtain\n(B) floral arrangement" }, { "from": "gpt", "value": "(B) floral arrangement" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333319_28607337553666_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from table (highlighted by a red box)? studio couch (highlighted by a blue box) or vase (highlighted by a green box)?\n(A) studio couch\n(B) vase" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458511_113804650069958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to picture frame (highlighted by a red box)? Choose from light switch (highlighted by a blue box) and door (highlighted by a green box).\n(A) light switch\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333324_29322425196916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chair (highlighted by a red box) or cardboard box (highlighted by a blue box)?\n(A) chair\n(B) cardboard box" }, { "from": "gpt", "value": "(B) cardboard box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897462_470168062883416_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to fireplace (highlighted by a red box)? Select from mirror (highlighted by a blue box) and fireplace (highlighted by a green box).\n(A) mirror\n(B) fireplace" }, { "from": "gpt", "value": "(B) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332792_47338292713541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to blanket (highlighted by a red box)? dresser (highlighted by a blue box) or chest of drawers (highlighted by a green box).\n(A) dresser\n(B) chest of drawers" }, { "from": "gpt", "value": "(B) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458614_125668691536041_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to plain (highlighted by a red box)? Choose from shower curtain (highlighted by a blue box) and sit (highlighted by a green box).\n(A) shower curtain\n(B) sit" }, { "from": "gpt", "value": "(B) sit" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334070_87062412531416_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the sink (highlighted by a red box)? bath mat (highlighted by a blue box) or bathroom cabinet (highlighted by a green box).\n(A) bath mat\n(B) bathroom cabinet" }, { "from": "gpt", "value": "(B) bathroom cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670311_64334838697750_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from table (highlighted by a red box)? window sill (highlighted by a blue box) or basket (highlighted by a green box)?\n(A) window sill\n(B) basket" }, { "from": "gpt", "value": "(B) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898261_697072523572083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, power outlet (highlighted by a red box) or desk (highlighted by a blue box)?\n(A) power outlet\n(B) desk" }, { "from": "gpt", "value": "(B) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899353_715991473655000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, sink (highlighted by a red box) or bath towel (highlighted by a blue box)?\n(A) sink\n(B) bath towel" }, { "from": "gpt", "value": "(B) bath towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331174_276462904319000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, clothing (highlighted by a red box) or clothing (highlighted by a blue box)?\n(A) clothing\n(B) clothing" }, { "from": "gpt", "value": "(B) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331591_16031979651083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670234_52930973823500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, shower curtain (highlighted by a red box) or tap (highlighted by a blue box)?\n(A) shower curtain\n(B) tap" }, { "from": "gpt", "value": "(B) tap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333308_28081336039333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, appliance (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895611_470246601682208_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to toiletry (highlighted by a red box)? Choose from drawer (highlighted by a blue box) and sink (highlighted by a green box).\n(A) drawer\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649605_36463719872625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, door (highlighted by a red box) or light switch (highlighted by a blue box)?\n(A) door\n(B) light switch" }, { "from": "gpt", "value": "(B) light switch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333523_50275198918041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, bath mat (highlighted by a red box) or toilet bowl (highlighted by a blue box)?\n(A) bath mat\n(B) toilet bowl" }, { "from": "gpt", "value": "(A) bath mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895272_79416312400833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, cabinetry (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) cabinetry\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430592_311063710372250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, storage box (highlighted by a red box) or box (highlighted by a blue box)?\n(A) storage box\n(B) box" }, { "from": "gpt", "value": "(B) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446497_357491731546583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, light switch (highlighted by a red box) or towel bar (highlighted by a blue box)?\n(A) light switch\n(B) towel bar" }, { "from": "gpt", "value": "(A) light switch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429886_367902628708125_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to radiator (highlighted by a red box)? Choose from chest of drawers (highlighted by a blue box) and furniture (highlighted by a green box).\n(A) chest of drawers\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333666_131937393146750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, toy (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) toy\n(B) shelf" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444869_97916885762291_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333801_51139548197083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from bookshelf (highlighted by a red box)? Choose among these: paper towel (highlighted by a blue box) or screen door (highlighted by a green box).\n(A) paper towel\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446444_82667320636333_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from studio couch (highlighted by a red box), picture frame (highlighted by a blue box) or coffee table (highlighted by a green box)?\n(A) picture frame\n(B) coffee table" }, { "from": "gpt", "value": "(B) coffee table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018331_116105110296333_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from silverware (highlighted by a red box)? Choose from utensil (highlighted by a blue box) and utensil (highlighted by a green box).\n(A) utensil\n(B) utensil" }, { "from": "gpt", "value": "(A) utensil" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739425_191758304232833_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from flower (highlighted by a red box)? plant (highlighted by a blue box) or flower (highlighted by a green box)?\n(A) plant\n(B) flower" }, { "from": "gpt", "value": "(A) plant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669960_27607101375666_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to picture frame (highlighted by a red box), door (highlighted by a blue box) or table (highlighted by a green box)?\n(A) door\n(B) table" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261686_3787953841916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897720_114136645704208_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to armchair (highlighted by a red box)? table lamp (highlighted by a blue box) or studio couch (highlighted by a green box).\n(A) table lamp\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332026_202777494460666_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739960_18556778699625_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, drawer (highlighted by a red box) or drawer (highlighted by a blue box)?\n(A) drawer\n(B) drawer" }, { "from": "gpt", "value": "(B) drawer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796745_28649871940000_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to window (highlighted by a red box)? pillow (highlighted by a blue box) or lamp (highlighted by a green box).\n(A) pillow\n(B) lamp" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261598_52912392111500_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from screen door (highlighted by a red box)? pillow (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649714_47800656510250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chair (highlighted by a red box) or material (highlighted by a blue box)?\n(A) chair\n(B) material" }, { "from": "gpt", "value": "(B) material" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739563_198356145510708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, door (highlighted by a red box) or window screen (highlighted by a blue box)?\n(A) door\n(B) window screen" }, { "from": "gpt", "value": "(B) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430808_64022195835000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, picture frame (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) picture frame\n(B) curtain" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649774_43496108087791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897607_137263639362750_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204451_22953178807416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, speaker (highlighted by a red box) or speaker (highlighted by a blue box)?\n(A) speaker\n(B) speaker" }, { "from": "gpt", "value": "(A) speaker" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332591_362628079629583_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the bath mat (highlighted by a red box)? bath towel (highlighted by a blue box) or sink (highlighted by a green box).\n(A) bath towel\n(B) sink" }, { "from": "gpt", "value": "(A) bath towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333283_25395431111125_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the beach towel (highlighted by a red box)? Choose among these: chair (highlighted by a blue box) or table (highlighted by a green box).\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897643_146873878667125_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from oven (highlighted by a red box)? Choose from gas stove (highlighted by a blue box) and microwave oven (highlighted by a green box).\n(A) gas stove\n(B) microwave oven" }, { "from": "gpt", "value": "(B) microwave oven" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895482_134803420928915_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895946_109227420269458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, sink (highlighted by a red box) or bath mat (highlighted by a blue box)?\n(A) sink\n(B) bath mat" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739678_705807105125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, piano (highlighted by a red box) or window (highlighted by a blue box)?\n(A) piano\n(B) window" }, { "from": "gpt", "value": "(A) piano" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446579_205817445391625_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the door (highlighted by a red box)? radiator (highlighted by a blue box) or bicycle (highlighted by a green box).\n(A) radiator\n(B) bicycle" }, { "from": "gpt", "value": "(B) bicycle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430293_187354353440833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, book (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) book\n(B) chair" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115415_4121960771082_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from mat (highlighted by a red box)? pillow (highlighted by a blue box) or table (highlighted by a green box)?\n(A) pillow\n(B) table" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018869_653374086375791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, desk (highlighted by a red box) or desk (highlighted by a blue box)?\n(A) desk\n(B) desk" }, { "from": "gpt", "value": "(B) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204786_27373568423250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, lamp (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) lamp\n(B) studio couch" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662806_13574880750583_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is shelf (annotated by the red box) located relative to cabinet? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331507_155060221070458_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, window (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) window\n(B) toy" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896591_32875729455082_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, bottle (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115287_118112032752708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to beverage (highlighted by a red box)? sink (highlighted by a blue box) or beverage (highlighted by a green box).\n(A) sink\n(B) beverage" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261153_587617659375_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to fireplace (highlighted by a red box)? television (highlighted by a blue box) or furniture (highlighted by a green box).\n(A) television\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458315_102419155413958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from pillow (highlighted by a red box)? pillow (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115216_95053236908125_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to window (highlighted by a red box)? Choose from studio couch (highlighted by a blue box) and coffee table (highlighted by a green box).\n(A) studio couch\n(B) coffee table" }, { "from": "gpt", "value": "(B) coffee table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115235_95849250098166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204744_25392177167125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, stool (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) stool\n(B) pillow" }, { "from": "gpt", "value": "(A) stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333494_62223496152916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, cabinetry (highlighted by a red box) or couch (highlighted by a blue box)?\n(A) cabinetry\n(B) couch" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796507_3153608977458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, mirror (highlighted by a red box) or window (highlighted by a blue box)?\n(A) mirror\n(B) window" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895943_107789125066166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, screen door (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) screen door\n(B) mat" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897990_219031267771708_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from pillow (highlighted by a red box)? Choose from pillow (highlighted by a blue box) and bed (highlighted by a green box).\n(A) pillow\n(B) bed" }, { "from": "gpt", "value": "(B) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334934_663247601642000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, houseplant (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) houseplant\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796722_27570977502583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, picture frame (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) picture frame\n(B) houseplant" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261257_12730996862750_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the table lamp (highlighted by a red box)? shelf (highlighted by a blue box) or armchair (highlighted by a green box).\n(A) shelf\n(B) armchair" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261331_24062936515625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from towel bar (highlighted by a red box)? Select from door (highlighted by a blue box) and toiletry (highlighted by a green box).\n(A) door\n(B) toiletry" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334849_615462535084333_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358118_62537294333750_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from appliance (highlighted by a red box), appliance (highlighted by a blue box) or oven (highlighted by a green box)?\n(A) appliance\n(B) oven" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458260_74325052491958_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, table (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) table\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331910_627571874897125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, studio couch (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) studio couch\n(B) mat" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898687_577212902154625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, sink (highlighted by a red box) or toilet bowl (highlighted by a blue box)?\n(A) sink\n(B) toilet bowl" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899559_199462701351625_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from tap (highlighted by a red box)? Choose among these: sink (highlighted by a blue box) or tile (highlighted by a green box).\n(A) sink\n(B) tile" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332107_683126709347083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, screen door (highlighted by a red box) or door (highlighted by a blue box)?\n(A) screen door\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261651_1359024235041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to studio couch (highlighted by a red box)? Select from curtain (highlighted by a blue box) and nightstand (highlighted by a green box).\n(A) curtain\n(B) nightstand" }, { "from": "gpt", "value": "(B) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445935_79412965900375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to table (highlighted by a red box)? Choose from christmas decoration (highlighted by a blue box) and radiator (highlighted by a green box).\n(A) christmas decoration\n(B) radiator" }, { "from": "gpt", "value": "(A) christmas decoration" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897756_117668517396666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to electric outlet (highlighted by a red box)? Choose from book (highlighted by a blue box) and book (highlighted by a green box).\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333618_76385731484791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to window sill (highlighted by a red box)? houseplant (highlighted by a blue box) or table (highlighted by a green box).\n(A) houseplant\n(B) table" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899053_646955293255041_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from studio couch (highlighted by a red box), pillow (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895469_132829918352125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, armchair (highlighted by a red box) or armchair (highlighted by a blue box)?\n(A) armchair\n(B) armchair" }, { "from": "gpt", "value": "(B) armchair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331365_195078386952916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, lamp (highlighted by a red box) or window (highlighted by a blue box)?\n(A) lamp\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332207_264597781816083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to table (highlighted by a red box)? Select from toy (highlighted by a blue box) and toy (highlighted by a green box).\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458549_127609323049333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, table (highlighted by a red box) or plant (highlighted by a blue box)?\n(A) table\n(B) plant" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334672_391428113259833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, shelf (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) shelf\n(B) shelf" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204919_3660490891291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, door (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) door\n(B) screen door" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261728_2852298383666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the appliance (highlighted by a red box)? Choose among these: appliance (highlighted by a blue box) or exhaust hood (highlighted by a green box).\n(A) appliance\n(B) exhaust hood" }, { "from": "gpt", "value": "(B) exhaust hood" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334459_100776184973708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, bottle (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) bottle\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649478_14885532262625_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from pillow (highlighted by a red box), pillow (highlighted by a blue box) or studio couch (highlighted by a green box)?\n(A) pillow\n(B) studio couch" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332810_48260832304541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, refrigerator (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) refrigerator\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429804_737539529296916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, houseplant (highlighted by a red box) or window screen (highlighted by a blue box)?\n(A) houseplant\n(B) window screen" }, { "from": "gpt", "value": "(B) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334207_103261792279875_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from flower (highlighted by a red box)? Choose from houseplant (highlighted by a blue box) and door (highlighted by a green box).\n(A) houseplant\n(B) door" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649774_43594202600708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, chest of drawers (highlighted by a red box) or door (highlighted by a blue box)?\n(A) chest of drawers\n(B) door" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896404_16761318530541_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, furniture (highlighted by a red box) or stairwell (highlighted by a blue box)?\n(A) furniture\n(B) stairwell" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018524_821517995116416_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from bed (highlighted by a red box)? nightstand (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) nightstand\n(B) pillow" }, { "from": "gpt", "value": "(A) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334935_663022892760250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of furniture (annotated by the red box) in reference to furniture?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333649_126254524534416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, lamp (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) lamp\n(B) curtain" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204585_586617212375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from cabinetry (highlighted by a red box), screen door (highlighted by a blue box) or light fixture (highlighted by a green box)?\n(A) screen door\n(B) light fixture" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895946_109225421060333_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895911_111534842540375_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from bottle (highlighted by a red box)? brush (highlighted by a blue box) or toiletry (highlighted by a green box)?\n(A) brush\n(B) toiletry" }, { "from": "gpt", "value": "(B) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898571_183795089944583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, couch (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) couch\n(B) screen door" }, { "from": "gpt", "value": "(A) couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896089_143902093756041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, doormat (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) doormat\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899352_715969282859708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from counter top (highlighted by a red box)? Select from luggage (highlighted by a blue box) and concrete (highlighted by a green box).\n(A) luggage\n(B) concrete" }, { "from": "gpt", "value": "(B) concrete" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204305_15268270272916_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897945_351430714516875_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to window (highlighted by a red box), picture frame (highlighted by a blue box) or christmas tree (highlighted by a green box)?\n(A) picture frame\n(B) christmas tree" }, { "from": "gpt", "value": "(B) christmas tree" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261675_3119444888916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, sheet (highlighted by a red box) or sheet (highlighted by a blue box)?\n(A) sheet\n(B) sheet" }, { "from": "gpt", "value": "(A) sheet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739563_198368157428208_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the light fixture (highlighted by a red box)? light fixture (highlighted by a blue box) or floral arrangement (highlighted by a green box).\n(A) light fixture\n(B) floral arrangement" }, { "from": "gpt", "value": "(A) light fixture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333826_53470847064791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, water heater (highlighted by a red box) or towel (highlighted by a blue box)?\n(A) water heater\n(B) towel" }, { "from": "gpt", "value": "(B) towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429739_20236859424375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from cabinetry (highlighted by a red box)? Choose from window frame (highlighted by a blue box) and mirror (highlighted by a green box).\n(A) window frame\n(B) mirror" }, { "from": "gpt", "value": "(A) window frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333600_75341790617625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, table (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649393_11293699990458_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, lamp (highlighted by a red box) or candle holder (highlighted by a blue box)?\n(A) lamp\n(B) candle holder" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739353_186914791676458_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to towel (highlighted by a red box)? Select from bathtub (highlighted by a blue box) and towel (highlighted by a green box).\n(A) bathtub\n(B) towel" }, { "from": "gpt", "value": "(B) towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018315_109642753440000_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445736_64093493822500_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from toaster (highlighted by a red box)? bottle (highlighted by a blue box) or counter (highlighted by a green box)?\n(A) bottle\n(B) counter" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261172_1552056879833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from vase (highlighted by a red box)? Choose from bottle (highlighted by a blue box) and houseplant (highlighted by a green box).\n(A) bottle\n(B) houseplant" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430795_60932068997625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from closet (highlighted by a red box)? Select from picture frame (highlighted by a blue box) and bed (highlighted by a green box).\n(A) picture frame\n(B) bed" }, { "from": "gpt", "value": "(B) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445695_57398291976916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from ladder (highlighted by a red box)? Choose from folding chair (highlighted by a blue box) and helmet (highlighted by a green box).\n(A) folding chair\n(B) helmet" }, { "from": "gpt", "value": "(B) helmet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430809_64084603945250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, curtain (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) curtain\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669959_27742095445708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, swivel chair (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) swivel chair\n(B) cabinetry" }, { "from": "gpt", "value": "(A) swivel chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115238_97826881446875_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from computer monitor (highlighted by a red box), studio couch (highlighted by a blue box) or entertainment center (highlighted by a green box)?\n(A) studio couch\n(B) entertainment center" }, { "from": "gpt", "value": "(B) entertainment center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649393_11205703221833_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to bookcase (highlighted by a red box)? Select from table (highlighted by a blue box) and tableware (highlighted by a green box).\n(A) table\n(B) tableware" }, { "from": "gpt", "value": "(B) tableware" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898701_580975983853791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, cabinetry (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) cabinetry\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333268_21988320290500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, table (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) table\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430934_94899030238541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, cabinet (highlighted by a red box) or washing machine (highlighted by a blue box)?\n(A) cabinet\n(B) washing machine" }, { "from": "gpt", "value": "(A) cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332066_250032787470958_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the door (highlighted by a red box)? Choose among these: door (highlighted by a blue box) or frying pan (highlighted by a green box).\n(A) door\n(B) frying pan" }, { "from": "gpt", "value": "(B) frying pan" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261509_43566428421916_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from light switch (highlighted by a red box)? door (highlighted by a blue box) or glass door (highlighted by a green box)?\n(A) door\n(B) glass door" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458572_296176117875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, home appliance (highlighted by a red box) or kitchen appliance (highlighted by a blue box)?\n(A) home appliance\n(B) kitchen appliance" }, { "from": "gpt", "value": "(A) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48017888_79783313182958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, bed (highlighted by a red box) or dresser (highlighted by a blue box)?\n(A) bed\n(B) dresser" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358362_16387367203250_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to table (highlighted by a red box)? Choose from magazine (highlighted by a blue box) and couch (highlighted by a green box).\n(A) magazine\n(B) couch" }, { "from": "gpt", "value": "(A) magazine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331277_13143841425333_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to paperback book (highlighted by a red box), floral arrangement (highlighted by a blue box) or paperback book (highlighted by a green box)?\n(A) floral arrangement\n(B) paperback book" }, { "from": "gpt", "value": "(B) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018286_799469519504791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, furniture (highlighted by a red box) or door (highlighted by a blue box)?\n(A) furniture\n(B) door" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334057_86249990752125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, studio couch (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) studio couch\n(B) radiator" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899642_232057189424583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhere is stool (annotated by the red box) located in relation to swivel chair in the image?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444712_73973717040041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is curtain (annotated by the red box) located in relation to door in the image? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333292_26371536093291_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to toilet paper (highlighted by a red box)? Select from bottle (highlighted by a blue box) and toilet paper (highlighted by a green box).\n(A) bottle\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333574_207483828127708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, table (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) table\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895861_489081051641958_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895987_136428104270250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, book (highlighted by a red box) or paperback book (highlighted by a blue box)?\n(A) book\n(B) paperback book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204832_610047747458_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chair (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) chair\n(B) curtain" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897643_146920176689375_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the mat (highlighted by a red box)? Choose among these: chair (highlighted by a blue box) or houseplant (highlighted by a green box).\n(A) chair\n(B) houseplant" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897955_216402826888666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, table (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) table\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895491_450912066364875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, chair (highlighted by a red box) or desk (highlighted by a blue box)?\n(A) chair\n(B) desk" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796208_1591464708750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, bed (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) bed\n(B) electric outlet" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458587_1595074546625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, door (highlighted by a red box) or door (highlighted by a blue box)?\n(A) door\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331910_627579871674791_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739716_3200769751208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, window (highlighted by a red box) or soap dispenser (highlighted by a blue box)?\n(A) window\n(B) soap dispenser" }, { "from": "gpt", "value": "(B) soap dispenser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896038_130000948060791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of shelf (annotated by the red box) in relation to window blind?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896510_33449375593791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to plain (highlighted by a red box)? Select from picture frame (highlighted by a blue box) and coffee table (highlighted by a green box).\n(A) picture frame\n(B) coffee table" }, { "from": "gpt", "value": "(B) coffee table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898393_369393418151125_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the bed (highlighted by a red box)? Choose among these: laundry basket (highlighted by a blue box) or nightstand (highlighted by a green box).\n(A) laundry basket\n(B) nightstand" }, { "from": "gpt", "value": "(B) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115177_104329238346666_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, curtain (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) curtain\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739276_42889467880833_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to chair (highlighted by a red box)? Choose from throw pillow (highlighted by a blue box) and chair (highlighted by a green box).\n(A) throw pillow\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896587_32913231272541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, bottle (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895903_493405656358583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to picture frame (highlighted by a red box), microwave oven (highlighted by a blue box) or table (highlighted by a green box)?\n(A) microwave oven\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447287_408822598604541_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, counter top (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) counter top\n(B) cabinetry" }, { "from": "gpt", "value": "(A) counter top" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828233_69834333154333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, picture frame (highlighted by a red box) or window (highlighted by a blue box)?\n(A) picture frame\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333673_134097758037125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from clothing (highlighted by a red box), infant bed (highlighted by a blue box) or clothing (highlighted by a green box)?\n(A) infant bed\n(B) clothing" }, { "from": "gpt", "value": "(A) infant bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333264_21807810463833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from bottle (highlighted by a red box), appliance (highlighted by a blue box) or cabinetry (highlighted by a green box)?\n(A) appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670023_32294609257166_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to lamp (highlighted by a red box), electric outlet (highlighted by a blue box) or window screen (highlighted by a green box)?\n(A) electric outlet\n(B) window screen" }, { "from": "gpt", "value": "(B) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333624_77207659252708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is person (annotated by the red box) located relative to houseplant?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662897_19427193753833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, ball (highlighted by a red box) or television (highlighted by a blue box)?\n(A) ball\n(B) television" }, { "from": "gpt", "value": "(B) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649634_39435954010708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chair (highlighted by a red box) or bath mat (highlighted by a blue box)?\n(A) chair\n(B) bath mat" }, { "from": "gpt", "value": "(B) bath mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430452_1933645962333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from wood (highlighted by a red box), television (highlighted by a blue box) or table lamp (highlighted by a green box)?\n(A) television\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458249_79410164842958_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, window frame (highlighted by a red box) or cleaning product (highlighted by a blue box)?\n(A) window frame\n(B) cleaning product" }, { "from": "gpt", "value": "(A) window frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739925_16346465726500_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, chest of drawers (highlighted by a red box) or bed (highlighted by a blue box)?\n(A) chest of drawers\n(B) bed" }, { "from": "gpt", "value": "(B) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899198_186610172930000_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from window (highlighted by a red box)? Select from animal (highlighted by a blue box) and plant (highlighted by a green box).\n(A) animal\n(B) plant" }, { "from": "gpt", "value": "(B) plant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018264_793751070016541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, electric outlet (highlighted by a red box) or bed (highlighted by a blue box)?\n(A) electric outlet\n(B) bed" }, { "from": "gpt", "value": "(A) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331938_164845616323791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of pillow (annotated by the red box) in reference to material?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446607_88154785333000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, pillow (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) pillow\n(B) picture frame" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333308_28025342059166_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from coffee cup (highlighted by a red box), table (highlighted by a blue box) or microwave oven (highlighted by a green box)?\n(A) table\n(B) microwave oven" }, { "from": "gpt", "value": "(B) microwave oven" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018788_17546052027041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from light switch (highlighted by a red box)? table (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649775_43382303095541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, pillow (highlighted by a red box) or window (highlighted by a blue box)?\n(A) pillow\n(B) window" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331766_7403949095458_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, bottle (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899944_864856039493958_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334273_157195264593291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, countertop (highlighted by a red box) or food (highlighted by a blue box)?\n(A) countertop\n(B) food" }, { "from": "gpt", "value": "(A) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897480_470977420373208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, chair (highlighted by a red box) or table (highlighted by a blue box)?\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796214_2020418362000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, mirror (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) mirror\n(B) curtain" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332201_264350382229166_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to picture frame (highlighted by a red box)? Select from toy (highlighted by a blue box) and toy (highlighted by a green box).\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796227_2493415551083_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from nightstand (highlighted by a red box)? pillow (highlighted by a blue box) or window (highlighted by a green box)?\n(A) pillow\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333293_26516626429541_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from garden hose (highlighted by a red box), soap (highlighted by a blue box) or soap (highlighted by a green box)?\n(A) soap\n(B) soap" }, { "from": "gpt", "value": "(A) soap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018760_15075346626250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, houseplant (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) houseplant\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662831_15040005763083_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the kitchen appliance (highlighted by a red box)? Choose among these: appliance (highlighted by a blue box) or light fixture (highlighted by a green box).\n(A) appliance\n(B) light fixture" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334754_421215708789625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from door (highlighted by a red box)? door (highlighted by a blue box) or mirror (highlighted by a green box)?\n(A) door\n(B) mirror" }, { "from": "gpt", "value": "(B) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333277_24427808363250_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from chair (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445169_7795225227541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from lamp (highlighted by a red box)? Choose among these: bay window (highlighted by a blue box) or fireplace (highlighted by a green box).\n(A) bay window\n(B) fireplace" }, { "from": "gpt", "value": "(A) bay window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334489_104638229595166_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333275_24764503506791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, table (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) table\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895279_79289913788250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, door (highlighted by a red box) or television (highlighted by a blue box)?\n(A) door\n(B) television" }, { "from": "gpt", "value": "(B) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261230_13425321022791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from plant (highlighted by a red box)? Choose among these: kitchen & dining room table (highlighted by a blue box) or chair (highlighted by a green box).\n(A) kitchen & dining room table\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895789_678564224035375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, nightstand (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) nightstand\n(B) pillow" }, { "from": "gpt", "value": "(A) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430978_101810919472958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, table (highlighted by a red box) or throw pillow (highlighted by a blue box)?\n(A) table\n(B) throw pillow" }, { "from": "gpt", "value": "(B) throw pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332473_886594168472416_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from bath mat (highlighted by a red box)? tap (highlighted by a blue box) or kettle (highlighted by a green box)?\n(A) tap\n(B) kettle" }, { "from": "gpt", "value": "(B) kettle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670075_38545509879958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, coffee table (highlighted by a red box) or board game (highlighted by a blue box)?\n(A) coffee table\n(B) board game" }, { "from": "gpt", "value": "(B) board game" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670048_33404908551000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to toy (highlighted by a red box)? Choose from toy (highlighted by a blue box) and toy (highlighted by a green box).\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018800_18803683636333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, studio couch (highlighted by a red box) or nightstand (highlighted by a blue box)?\n(A) studio couch\n(B) nightstand" }, { "from": "gpt", "value": "(B) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796579_16786173682916_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from window (highlighted by a red box)? picture frame (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) picture frame\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896487_23762802410916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, door (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) door\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018828_647400971236875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, shower curtain (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) shower curtain\n(B) shelf" }, { "from": "gpt", "value": "(A) shower curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897605_137295643097333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from glass door (highlighted by a red box)? Select from pillow (highlighted by a blue box) and light fixture (highlighted by a green box).\n(A) pillow\n(B) light fixture" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796684_30790947047916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, cabinetry (highlighted by a red box) or home appliance (highlighted by a blue box)?\n(A) cabinetry\n(B) home appliance" }, { "from": "gpt", "value": "(B) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897512_472714500659166_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to box (highlighted by a red box), workbench (highlighted by a blue box) or box (highlighted by a green box)?\n(A) workbench\n(B) box" }, { "from": "gpt", "value": "(A) workbench" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444738_77960396573208_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from door (highlighted by a red box)? book (highlighted by a blue box) or curtain (highlighted by a green box)?\n(A) book\n(B) curtain" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896461_21732891037958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from bathroom cabinet (highlighted by a red box)? Choose from towel bar (highlighted by a blue box) and tap (highlighted by a green box).\n(A) towel bar\n(B) tap" }, { "from": "gpt", "value": "(A) towel bar" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649382_10502159208708_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358118_62587390265666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from coffee machine (highlighted by a red box)? Choose among these: kitchen appliance (highlighted by a blue box) or countertop (highlighted by a green box).\n(A) kitchen appliance\n(B) countertop" }, { "from": "gpt", "value": "(B) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261395_29046955054458_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649615_36964264558666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, door (highlighted by a red box) or ceramic tile (highlighted by a blue box)?\n(A) door\n(B) ceramic tile" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828243_81864991772833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from nightstand (highlighted by a red box)? pillow (highlighted by a blue box) or charger (highlighted by a green box)?\n(A) pillow\n(B) charger" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670044_33319409063708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from toy (highlighted by a red box)? Choose from plain (highlighted by a blue box) and toy (highlighted by a green box).\n(A) plain\n(B) toy" }, { "from": "gpt", "value": "(A) plain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796520_4047811230791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, toilet (highlighted by a red box) or ceramic tile (highlighted by a blue box)?\n(A) toilet\n(B) ceramic tile" }, { "from": "gpt", "value": "(A) toilet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445729_63901805687583_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896551_30292891529291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to nightstand (highlighted by a red box), table lamp (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) table lamp\n(B) pillow" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334729_535888136353165_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, television (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) television\n(B) appliance" }, { "from": "gpt", "value": "(A) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896527_34748917602666_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, storage box (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) storage box\n(B) basket" }, { "from": "gpt", "value": "(A) storage box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649798_46222610507416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, sink (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) sink\n(B) bottle" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669881_10930904976541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, window screen (highlighted by a red box) or window (highlighted by a blue box)?\n(A) window screen\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333249_33640413181958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, poster (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) poster\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739916_15639386147625_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the door (highlighted by a red box)? Choose among these: window (highlighted by a blue box) or light switch (highlighted by a green box).\n(A) window\n(B) light switch" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662886_16447682002041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, glass bowl (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) glass bowl\n(B) radiator" }, { "from": "gpt", "value": "(A) glass bowl" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895719_373260090885291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to brush (highlighted by a red box)? Select from toilet (highlighted by a blue box) and cleaning product (highlighted by a green box).\n(A) toilet\n(B) cleaning product" }, { "from": "gpt", "value": "(B) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897732_115047390224125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, chair (highlighted by a red box) or laptop (highlighted by a blue box)?\n(A) chair\n(B) laptop" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649603_36103598892875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649478_15107127877916_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from table (highlighted by a red box)? Select from book (highlighted by a blue box) and throw pillow (highlighted by a green box).\n(A) book\n(B) throw pillow" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260952_6058303312666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, window (highlighted by a red box) or table (highlighted by a blue box)?\n(A) window\n(B) table" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649393_11177698177291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, armchair (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) armchair\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42923207_1803106137291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, electric outlet (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) electric outlet\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899003_640621723000833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to kitchen appliance (highlighted by a red box)? Choose from footwear (highlighted by a blue box) and kitchen appliance (highlighted by a green box).\n(A) footwear\n(B) kitchen appliance" }, { "from": "gpt", "value": "(B) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898680_576483887437083_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from shower (highlighted by a red box), bath towel (highlighted by a blue box) or counter top (highlighted by a green box)?\n(A) bath towel\n(B) counter top" }, { "from": "gpt", "value": "(B) counter top" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444928_221430384975791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from desk (highlighted by a red box)? Choose among these: swivel chair (highlighted by a blue box) or book (highlighted by a green box).\n(A) swivel chair\n(B) book" }, { "from": "gpt", "value": "(A) swivel chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358729_6609221315958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to radiator (highlighted by a red box)? curtain (highlighted by a blue box) or chair (highlighted by a green box).\n(A) curtain\n(B) chair" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115624_3661099403291_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from washing machine (highlighted by a red box)? drawer (highlighted by a blue box) or drawer (highlighted by a green box)?\n(A) drawer\n(B) drawer" }, { "from": "gpt", "value": "(B) drawer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895816_685901832794250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, drawer (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) drawer\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896466_21874784890208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, table (highlighted by a red box) or glass vase (highlighted by a blue box)?\n(A) table\n(B) glass vase" }, { "from": "gpt", "value": "(B) glass vase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332177_262496314933125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, chest of drawers (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) chest of drawers\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331498_153864315460541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, medicine cabinet (highlighted by a red box) or toilet (highlighted by a blue box)?\n(A) medicine cabinet\n(B) toilet" }, { "from": "gpt", "value": "(B) toilet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662800_12916675326083_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the window sill (highlighted by a red box)? studio couch (highlighted by a blue box) or window (highlighted by a green box).\n(A) studio couch\n(B) window" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332751_42653714561750_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, light switch (highlighted by a red box) or light switch (highlighted by a blue box)?\n(A) light switch\n(B) light switch" }, { "from": "gpt", "value": "(B) light switch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331049_482392414394833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, electric outlet (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) electric outlet\n(B) lamp" }, { "from": "gpt", "value": "(A) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828486_100898455797666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from chair (highlighted by a red box)? Choose among these: radiator (highlighted by a blue box) or book (highlighted by a green box).\n(A) radiator\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458634_127513885352291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is studio couch (annotated by the red box) located relative to pillow? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358225_9613342725666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from book (highlighted by a red box)? Choose from book (highlighted by a blue box) and coffee table (highlighted by a green box).\n(A) book\n(B) coffee table" }, { "from": "gpt", "value": "(B) coffee table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333031_59022938216666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, coffee table (highlighted by a red box) or clothing (highlighted by a blue box)?\n(A) coffee table\n(B) clothing" }, { "from": "gpt", "value": "(B) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261087_400868704333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from toy (highlighted by a red box)? Select from footwear (highlighted by a blue box) and footwear (highlighted by a green box).\n(A) footwear\n(B) footwear" }, { "from": "gpt", "value": "(A) footwear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115129_85583056078791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, electric outlet (highlighted by a red box) or shower (highlighted by a blue box)?\n(A) electric outlet\n(B) shower" }, { "from": "gpt", "value": "(B) shower" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828368_92201629078125_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the appliance (highlighted by a red box)? window sill (highlighted by a blue box) or countertop (highlighted by a green box).\n(A) window sill\n(B) countertop" }, { "from": "gpt", "value": "(B) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429821_744448899904750_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, studio couch (highlighted by a red box) or drawer (highlighted by a blue box)?\n(A) studio couch\n(B) drawer" }, { "from": "gpt", "value": "(B) drawer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018802_18905692386250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, studio couch (highlighted by a red box) or nightstand (highlighted by a blue box)?\n(A) studio couch\n(B) nightstand" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334767_424047835165416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the sink (highlighted by a red box)? Choose among these: toothbrush (highlighted by a blue box) or soap dispenser (highlighted by a green box).\n(A) toothbrush\n(B) soap dispenser" }, { "from": "gpt", "value": "(B) soap dispenser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897804_131420407720416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, appliance (highlighted by a red box) or ceramic tile (highlighted by a blue box)?\n(A) appliance\n(B) ceramic tile" }, { "from": "gpt", "value": "(B) ceramic tile" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796227_2479421369166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, curtain (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) curtain\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445684_61857661956666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, door (highlighted by a red box) or plank (highlighted by a blue box)?\n(A) door\n(B) plank" }, { "from": "gpt", "value": "(B) plank" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331128_174101237915291_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from floral arrangement (highlighted by a red box)? Choose from book (highlighted by a blue box) and book (highlighted by a green box).\n(A) book\n(B) book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899653_233556473330083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, couch (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) couch\n(B) pillow" }, { "from": "gpt", "value": "(A) couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898055_223322528305375_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670039_32827320917166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of door (annotated by the red box) and window in the image provided, where is door (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446445_354403130986333_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from pillow (highlighted by a red box)? Choose from bean bag chair (highlighted by a blue box) and furniture (highlighted by a green box).\n(A) bean bag chair\n(B) furniture" }, { "from": "gpt", "value": "(A) bean bag chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895956_133461163490875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, table (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) table\n(B) cabinetry" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261384_27719066396458_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to studio couch (highlighted by a red box)? Choose from window screen (highlighted by a blue box) and couch (highlighted by a green box).\n(A) window screen\n(B) couch" }, { "from": "gpt", "value": "(B) couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332044_207167382906416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, microwave (highlighted by a red box) or floral arrangement (highlighted by a blue box)?\n(A) microwave\n(B) floral arrangement" }, { "from": "gpt", "value": "(A) microwave" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898586_184290175222125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, appliance (highlighted by a red box) or tap (highlighted by a blue box)?\n(A) appliance\n(B) tap" }, { "from": "gpt", "value": "(B) tap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796721_27367874571666_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, cabinetry (highlighted by a red box) or fireplace (highlighted by a blue box)?\n(A) cabinetry\n(B) fireplace" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445585_283564773227750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, furniture (highlighted by a red box) or footwear (highlighted by a blue box)?\n(A) furniture\n(B) footwear" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895469_132742021086166_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334756_421306505361208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, flowerpot (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) flowerpot\n(B) window sill" }, { "from": "gpt", "value": "(A) flowerpot" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670271_66564412373375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, floral arrangement (highlighted by a red box) or tap (highlighted by a blue box)?\n(A) floral arrangement\n(B) tap" }, { "from": "gpt", "value": "(A) floral arrangement" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018639_635865870582041_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261294_16248838266333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from shutter (highlighted by a red box)? Select from table (highlighted by a blue box) and shutter (highlighted by a green box).\n(A) table\n(B) shutter" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204857_1583624381541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to bathroom cabinet (highlighted by a red box)? bath (highlighted by a blue box) or bath towel (highlighted by a green box).\n(A) bath\n(B) bath towel" }, { "from": "gpt", "value": "(A) bath" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898530_181138757996000_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from chair (highlighted by a red box), table (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333803_51392545547500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from book (highlighted by a red box), book (highlighted by a blue box) or book (highlighted by a green box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458519_113933549091000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, bed (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) bed\n(B) radiator" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670016_30465981990916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, window (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) window\n(B) curtain" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333060_60834762900250_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the bath towel (highlighted by a red box)? bottle (highlighted by a blue box) or counter top (highlighted by a green box).\n(A) bottle\n(B) counter top" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445599_285107824079625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from electric outlet (highlighted by a red box)? electric outlet (highlighted by a blue box) or chest of drawers (highlighted by a green box)?\n(A) electric outlet\n(B) chest of drawers" }, { "from": "gpt", "value": "(B) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446561_86473464949416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, furniture (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) furniture\n(B) furniture" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018328_116007899478041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the appliance (highlighted by a red box)? curtain (highlighted by a blue box) or shelf (highlighted by a green box).\n(A) curtain\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670328_65783785683458_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to picture frame (highlighted by a red box)? door (highlighted by a blue box) or houseplant (highlighted by a green box).\n(A) door\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796752_29846760316208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, ball (highlighted by a red box) or bean bag chair (highlighted by a blue box)?\n(A) ball\n(B) bean bag chair" }, { "from": "gpt", "value": "(B) bean bag chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895287_80141643990958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, teddy (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) teddy\n(B) radiator" }, { "from": "gpt", "value": "(A) teddy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739418_191250670897583_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, radiator (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) radiator\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444750_79664474342125_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from kitchen appliance (highlighted by a red box)? gas stove (highlighted by a blue box) or washing machine (highlighted by a green box)?\n(A) gas stove\n(B) washing machine" }, { "from": "gpt", "value": "(B) washing machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115501_12487906640041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to curtain (highlighted by a red box)? lamp (highlighted by a blue box) or shoe (highlighted by a green box).\n(A) lamp\n(B) shoe" }, { "from": "gpt", "value": "(B) shoe" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115265_115137263561291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, door (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) door\n(B) radiator" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897480_470915129352833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, appliance (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662959_24611593743875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, footrest (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) footrest\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332473_886576175743041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from appliance (highlighted by a red box)? Choose from window (highlighted by a blue box) and toy (highlighted by a green box).\n(A) window\n(B) toy" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739595_199706687892500_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chest of drawers (highlighted by a red box) or tool (highlighted by a blue box)?\n(A) chest of drawers\n(B) tool" }, { "from": "gpt", "value": "(B) tool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331003_178755727710500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, table (highlighted by a red box) or bed (highlighted by a blue box)?\n(A) table\n(B) bed" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446068_80621269119875_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the material (highlighted by a red box)? Choose among these: picture frame (highlighted by a blue box) or bathtub (highlighted by a green box).\n(A) picture frame\n(B) bathtub" }, { "from": "gpt", "value": "(B) bathtub" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429766_358310148539333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, mirror (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) mirror\n(B) screen door" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334172_350745555477333_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261317_23593479430833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the shelf (highlighted by a red box)? book (highlighted by a blue box) or book (highlighted by a green box).\n(A) book\n(B) book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115227_95980845318250_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796514_3263215585083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from window (highlighted by a red box)? Choose among these: footwear (highlighted by a blue box) or table (highlighted by a green box).\n(A) footwear\n(B) table" }, { "from": "gpt", "value": "(A) footwear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332469_886451276148416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to window (highlighted by a red box), alphabet (highlighted by a blue box) or mug (highlighted by a green box)?\n(A) alphabet\n(B) mug" }, { "from": "gpt", "value": "(A) alphabet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445587_284507133096958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, bath mat (highlighted by a red box) or bath mat (highlighted by a blue box)?\n(A) bath mat\n(B) bath mat" }, { "from": "gpt", "value": "(B) bath mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649393_11187710689500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, book (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) book\n(B) mat" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897462_470254060500500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from mirror (highlighted by a red box)? studio couch (highlighted by a blue box) or glass door (highlighted by a green box)?\n(A) studio couch\n(B) glass door" }, { "from": "gpt", "value": "(B) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899185_184275191631166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, door (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) door\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261658_1205337970875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhere is door (annotated by the red box) located in relation to door in the image?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333801_51117240557541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the toy (highlighted by a red box)? Choose among these: furniture (highlighted by a blue box) or toy (highlighted by a green box).\n(A) furniture\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649399_9720065248458_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429798_737337926982125_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from cabinetry (highlighted by a red box)? Choose among these: appliance (highlighted by a blue box) or appliance (highlighted by a green box).\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204820_28665220653791_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261087_362867748375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from appliance (highlighted by a red box)? Choose among these: bookshelf (highlighted by a blue box) or bottle (highlighted by a green box).\n(A) bookshelf\n(B) bottle" }, { "from": "gpt", "value": "(A) bookshelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796475_4326732067416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, paperback book (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) paperback book\n(B) toy" }, { "from": "gpt", "value": "(A) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670295_63442240491166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the notepad (highlighted by a red box)? computer monitor (highlighted by a blue box) or chair (highlighted by a green box).\n(A) computer monitor\n(B) chair" }, { "from": "gpt", "value": "(A) computer monitor" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895491_450914065553916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, table (highlighted by a red box) or swivel chair (highlighted by a blue box)?\n(A) table\n(B) swivel chair" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895825_1220067278352291_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261645_635110544958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, table (highlighted by a red box) or dog bed (highlighted by a blue box)?\n(A) table\n(B) dog bed" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899362_717650292218625_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739301_43627264359000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from bottle (highlighted by a red box)? trash bin/can (highlighted by a blue box) or laundry (highlighted by a green box)?\n(A) trash bin/can\n(B) laundry" }, { "from": "gpt", "value": "(B) laundry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796221_2063617090833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to window (highlighted by a red box)? bathroom cabinet (highlighted by a blue box) or tap (highlighted by a green box).\n(A) bathroom cabinet\n(B) tap" }, { "from": "gpt", "value": "(B) tap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828311_76504536507458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, desk (highlighted by a red box) or shopping basket (highlighted by a blue box)?\n(A) desk\n(B) shopping basket" }, { "from": "gpt", "value": "(B) shopping basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333308_28047349820250_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from box (highlighted by a red box)? Select from appliance (highlighted by a blue box) and appliance (highlighted by a green box).\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796358_10463347448750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, window (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) window\n(B) basket" }, { "from": "gpt", "value": "(B) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898472_157199807781458_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from chair (highlighted by a red box), pillow (highlighted by a blue box) or doormat (highlighted by a green box)?\n(A) pillow\n(B) doormat" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204341_14976905519958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to picture frame (highlighted by a red box)? Choose from lamp (highlighted by a blue box) and lamp (highlighted by a green box).\n(A) lamp\n(B) lamp" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670171_42351212115291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, bowl (highlighted by a red box) or table (highlighted by a blue box)?\n(A) bowl\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331938_164839918632791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of handbag (annotated by the red box) in relation to round table?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261292_16296736002916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from furniture (highlighted by a red box)? Choose from lamp (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) lamp\n(B) picture frame" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828562_102207771232750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, studio couch (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) studio couch\n(B) curtain" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649459_13914033482291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, fireplace (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) fireplace\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115222_95794739391416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, table (highlighted by a red box) or candle holder (highlighted by a blue box)?\n(A) table\n(B) candle holder" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261381_26870118174750_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, furniture (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) furniture\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332184_262600622732833_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to changing table (highlighted by a red box)? chest of drawers (highlighted by a blue box) or desk (highlighted by a green box).\n(A) chest of drawers\n(B) desk" }, { "from": "gpt", "value": "(B) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115508_12358008024083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to chair (highlighted by a red box)? Choose from table (highlighted by a blue box) and chair (highlighted by a green box).\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897436_104960944744833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, bath towel (highlighted by a red box) or hanger (highlighted by a blue box)?\n(A) bath towel\n(B) hanger" }, { "from": "gpt", "value": "(A) bath towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649417_10155598632583_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to book (highlighted by a red box)? Choose from bookcase (highlighted by a blue box) and window (highlighted by a green box).\n(A) bookcase\n(B) window" }, { "from": "gpt", "value": "(A) bookcase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895904_110659344695208_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the curtain (highlighted by a red box)? Choose among these: nightstand (highlighted by a blue box) or book (highlighted by a green box).\n(A) nightstand\n(B) book" }, { "from": "gpt", "value": "(A) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739255_39615223591083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, chair (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) chair\n(B) cabinetry" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204482_24632882491291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, door (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) door\n(B) studio couch" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895865_107658970568000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of picture frame (annotated by the red box) in reference to table lamp?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898959_821207691602958_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649605_36409825541541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from mirror (highlighted by a red box)? Select from furniture (highlighted by a blue box) and curtain (highlighted by a green box).\n(A) furniture\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261108_1099050269249_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, appliance (highlighted by a red box) or book (highlighted by a blue box)?\n(A) appliance\n(B) book" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739474_52466527507000_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the door (highlighted by a red box)? Choose among these: bath towel (highlighted by a blue box) or bathtub (highlighted by a green box).\n(A) bath towel\n(B) bathtub" }, { "from": "gpt", "value": "(B) bathtub" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115358_4327807218332_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from studio couch (highlighted by a red box)? Choose among these: radiator (highlighted by a blue box) or basket (highlighted by a green box).\n(A) radiator\n(B) basket" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261713_1517933839208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, bottle (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) bottle\n(B) appliance" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828504_102324063605208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chest of drawers (highlighted by a red box) or fireplace (highlighted by a blue box)?\n(A) chest of drawers\n(B) fireplace" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895571_1153738433825291_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260938_4796197698041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to picture frame (highlighted by a red box), picture frame (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458706_136782060117207_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from vent (highlighted by a red box)? Choose from cabinetry (highlighted by a blue box) and appliance (highlighted by a green box).\n(A) cabinetry\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458675_9319699857708_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899951_864779137972000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, window (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) window\n(B) curtain" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334040_279033907816289_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, furniture (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) furniture\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669939_15252929501166_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from fireplace (highlighted by a red box)? houseplant (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) houseplant\n(B) picture frame" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358660_1045187860666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the picture frame (highlighted by a red box)? Choose among these: vase (highlighted by a blue box) or mirror (highlighted by a green box).\n(A) vase\n(B) mirror" }, { "from": "gpt", "value": "(A) vase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444738_77984403375041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, door (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) door\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430544_300633238296291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to tap (highlighted by a red box)? Choose from bathtub (highlighted by a blue box) and bath mat (highlighted by a green box).\n(A) bathtub\n(B) bath mat" }, { "from": "gpt", "value": "(A) bathtub" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828391_94895689560041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, towel bar (highlighted by a red box) or bathroom cabinet (highlighted by a blue box)?\n(A) towel bar\n(B) bathroom cabinet" }, { "from": "gpt", "value": "(B) bathroom cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828498_101736695087458_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, door (highlighted by a red box) or window frame (highlighted by a blue box)?\n(A) door\n(B) window frame" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429762_356811950562000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, plant (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) plant\n(B) picture frame" }, { "from": "gpt", "value": "(A) plant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334205_103904475575375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, bottle (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260946_4663883345458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, chair (highlighted by a red box) or window (highlighted by a blue box)?\n(A) chair\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261230_13413309325666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from refrigerator (highlighted by a red box)? Choose from kitchen appliance (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) kitchen appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(A) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333875_76098072594375_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from tile (highlighted by a red box)? light switch (highlighted by a blue box) or screen door (highlighted by a green box)?\n(A) light switch\n(B) screen door" }, { "from": "gpt", "value": "(A) light switch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662884_16479785950123_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of picture frame (annotated by the red box) and mirror in the image provided, where is picture frame (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739261_40050488384000_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the stool (highlighted by a red box)? power outlet (highlighted by a blue box) or door (highlighted by a green box).\n(A) power outlet\n(B) door" }, { "from": "gpt", "value": "(A) power outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897509_472294407065041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, box (highlighted by a red box) or box (highlighted by a blue box)?\n(A) box\n(B) box" }, { "from": "gpt", "value": "(B) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430857_74506084875250_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018071_98135074453041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, toiletry (highlighted by a red box) or sink (highlighted by a blue box)?\n(A) toiletry\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897490_471184817958833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, tea pot (highlighted by a red box) or kitchen appliance (highlighted by a blue box)?\n(A) tea pot\n(B) kitchen appliance" }, { "from": "gpt", "value": "(B) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332705_109814822662500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, door (highlighted by a red box) or sink (highlighted by a blue box)?\n(A) door\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261158_662904440333_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from fireplace (highlighted by a red box)? picture frame (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332401_406009472099625_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to cabinetry (highlighted by a red box)? Choose from houseplant (highlighted by a blue box) and laptop (highlighted by a green box).\n(A) houseplant\n(B) laptop" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358118_62505290909666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447205_209341260913166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, towel rack (highlighted by a red box) or towel rack (highlighted by a blue box)?\n(A) towel rack\n(B) towel rack" }, { "from": "gpt", "value": "(B) towel rack" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332818_48822805672166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, curtain (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) curtain\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458315_102399147036000_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from pillow (highlighted by a red box), studio couch (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898500_159990184074833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, shelf (highlighted by a red box) or door (highlighted by a blue box)?\n(A) shelf\n(B) door" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430246_182507578817208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, book (highlighted by a red box) or bookcase (highlighted by a blue box)?\n(A) book\n(B) bookcase" }, { "from": "gpt", "value": "(B) bookcase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332106_683044009275666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, slate (highlighted by a red box) or bed (highlighted by a blue box)?\n(A) slate\n(B) bed" }, { "from": "gpt", "value": "(B) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358673_883085298458_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, sink (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) sink\n(B) appliance" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662886_16423691520833_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from mat (highlighted by a red box)? Choose from table (highlighted by a blue box) and fireplace (highlighted by a green box).\n(A) table\n(B) fireplace" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445597_284990738963375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhere is chest of drawers (annotated by the red box) located in relation to curtain in the image?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018537_828113641492000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, table (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) table\n(B) pillow" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649720_48008953158000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, appliance (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261275_14271246274208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, picture frame (highlighted by a red box) or mirror (highlighted by a blue box)?\n(A) picture frame\n(B) mirror" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895279_79247914178750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, houseplant (highlighted by a red box) or flower (highlighted by a blue box)?\n(A) houseplant\n(B) flower" }, { "from": "gpt", "value": "(B) flower" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332025_202686398190875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, exhaust hood (highlighted by a red box) or window (highlighted by a blue box)?\n(A) exhaust hood\n(B) window" }, { "from": "gpt", "value": "(A) exhaust hood" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331378_198323086410958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, window (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) window\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444904_106221552698166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, radiator (highlighted by a red box) or magazine (highlighted by a blue box)?\n(A) radiator\n(B) magazine" }, { "from": "gpt", "value": "(B) magazine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333659_130382175701833_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from toy (highlighted by a red box)? Select from furniture (highlighted by a blue box) and cardboard box (highlighted by a green box).\n(A) furniture\n(B) cardboard box" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204739_24131843866958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, window (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) window\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899271_883779103294541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to toiletry (highlighted by a red box)? Choose from mirror (highlighted by a blue box) and shower curtain (highlighted by a green box).\n(A) mirror\n(B) shower curtain" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445677_61054016398791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, book (highlighted by a red box) or paperback book (highlighted by a blue box)?\n(A) book\n(B) paperback book" }, { "from": "gpt", "value": "(B) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445736_64099491362458_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of stairs (annotated by the red box) in relation to furniture? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018278_794908780771166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, cabinetry (highlighted by a red box) or countertop (highlighted by a blue box)?\n(A) cabinetry\n(B) countertop" }, { "from": "gpt", "value": "(B) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897780_129213527884333_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895946_109213725684083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, sink (highlighted by a red box) or cage (highlighted by a blue box)?\n(A) sink\n(B) cage" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899030_643047777061458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, swivel chair (highlighted by a red box) or swivel chair (highlighted by a blue box)?\n(A) swivel chair\n(B) swivel chair" }, { "from": "gpt", "value": "(B) swivel chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897859_529540171069083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, door (highlighted by a red box) or hanger (highlighted by a blue box)?\n(A) door\n(B) hanger" }, { "from": "gpt", "value": "(B) hanger" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204303_15027570277583_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from picture frame (highlighted by a red box)? Select from studio couch (highlighted by a blue box) and table (highlighted by a green box).\n(A) studio couch\n(B) table" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332204_264166573371958_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chair (highlighted by a red box) or window (highlighted by a blue box)?\n(A) chair\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898510_160649690474583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, bookcase (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) bookcase\n(B) chair" }, { "from": "gpt", "value": "(A) bookcase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897939_351271213729333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the window screen (highlighted by a red box)? window (highlighted by a blue box) or plant (highlighted by a green box).\n(A) window\n(B) plant" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898696_580857682620541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is table (annotated by the red box) located relative to screen door? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662829_15199606358208_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from cabinetry (highlighted by a red box)? Select from vent (highlighted by a blue box) and countertop (highlighted by a green box).\n(A) vent\n(B) countertop" }, { "from": "gpt", "value": "(B) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446492_356603052721041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from clock (highlighted by a red box)? table (highlighted by a blue box) or crate (highlighted by a green box)?\n(A) table\n(B) crate" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332311_387801945084708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, toiletry (highlighted by a red box) or towel (highlighted by a blue box)?\n(A) toiletry\n(B) towel" }, { "from": "gpt", "value": "(B) towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333168_44172969732708_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to desk (highlighted by a red box)? Select from laptop (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) laptop\n(B) cabinetry" }, { "from": "gpt", "value": "(A) laptop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018062_718707135279166_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to light fixture (highlighted by a red box)? light fixture (highlighted by a blue box) or glass door (highlighted by a green box).\n(A) light fixture\n(B) glass door" }, { "from": "gpt", "value": "(A) light fixture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445771_64309376574041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from window (highlighted by a red box)? Select from bed (highlighted by a blue box) and curtain (highlighted by a green box).\n(A) bed\n(B) curtain" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458297_77411011110041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to bed (highlighted by a red box), pillow (highlighted by a blue box) or curtain (highlighted by a green box)?\n(A) pillow\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331346_192294509402125_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445794_64744351375750_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from bathtub (highlighted by a red box)? Choose from towel bar (highlighted by a blue box) and screen door (highlighted by a green box).\n(A) towel bar\n(B) screen door" }, { "from": "gpt", "value": "(A) towel bar" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115131_85650144977375_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to sink (highlighted by a red box)? Choose from bidet (highlighted by a blue box) and tap (highlighted by a green box).\n(A) bidet\n(B) tap" }, { "from": "gpt", "value": "(B) tap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333826_53472846251333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from bottle (highlighted by a red box)? Choose from bottle (highlighted by a blue box) and toiletry (highlighted by a green box).\n(A) bottle\n(B) toiletry" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333649_126244012136541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, studio couch (highlighted by a red box) or chest of drawers (highlighted by a blue box)?\n(A) studio couch\n(B) chest of drawers" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332704_108382957429166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, shaving cream (highlighted by a red box) or cleaning product (highlighted by a blue box)?\n(A) shaving cream\n(B) cleaning product" }, { "from": "gpt", "value": "(B) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358341_15069219483916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, lamp (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) lamp\n(B) chair" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47431173_352485576068166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, sink (highlighted by a red box) or bath mat (highlighted by a blue box)?\n(A) sink\n(B) bath mat" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796575_16951172023500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of furniture (annotated by the red box) in relation to stove? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429835_748711930670708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, box (highlighted by a red box) or storage box (highlighted by a blue box)?\n(A) box\n(B) storage box" }, { "from": "gpt", "value": "(B) storage box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897537_473589383070458_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from bed (highlighted by a red box)? dresser (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) dresser\n(B) pillow" }, { "from": "gpt", "value": "(A) dresser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445931_79351374114833_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204670_12419141194791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the chest of drawers (highlighted by a red box)? Choose among these: television (highlighted by a blue box) or stove (highlighted by a green box).\n(A) television\n(B) stove" }, { "from": "gpt", "value": "(A) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261490_41866369296791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, studio couch (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) studio couch\n(B) curtain" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331711_11313721260750_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, sink (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) sink\n(B) appliance" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896010_137042564580458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, stove (highlighted by a red box) or doormat (highlighted by a blue box)?\n(A) stove\n(B) doormat" }, { "from": "gpt", "value": "(B) doormat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445078_5602216293208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, book (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) book\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430221_180247401315416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204305_15338274431041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from picture frame (highlighted by a red box), stool (highlighted by a blue box) or bookcase (highlighted by a green box)?\n(A) stool\n(B) bookcase" }, { "from": "gpt", "value": "(B) bookcase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115352_4061001559708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of cupboard (annotated by the red box) in relation to fireplace?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445684_61849665292541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, furniture (highlighted by a red box) or door (highlighted by a blue box)?\n(A) furniture\n(B) door" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897455_469621471792333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is throw pillow (annotated by the red box) located relative to pillow?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358660_976898210541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to lamp (highlighted by a red box)? Select from lamp (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) lamp\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895571_1153714443476000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, appliance (highlighted by a red box) or faucet (highlighted by a blue box)?\n(A) appliance\n(B) faucet" }, { "from": "gpt", "value": "(B) faucet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895943_107787125857333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, floral arrangement (highlighted by a red box) or door (highlighted by a blue box)?\n(A) floral arrangement\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662835_15873642957500_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from picture frame (highlighted by a red box)? Choose among these: studio couch (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) studio couch\n(B) picture frame" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333003_128405505164333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the clothing (highlighted by a red box)? clothing (highlighted by a blue box) or clothing (highlighted by a green box).\n(A) clothing\n(B) clothing" }, { "from": "gpt", "value": "(A) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331627_20076046281958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, gas stove (highlighted by a red box) or gas stove (highlighted by a blue box)?\n(A) gas stove\n(B) gas stove" }, { "from": "gpt", "value": "(A) gas stove" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429773_359939726575708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from picture frame (highlighted by a red box)? Choose among these: picture frame (highlighted by a blue box) or lamp (highlighted by a green box).\n(A) picture frame\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739305_43529971314625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from bowl (highlighted by a red box)? Choose from clock (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) clock\n(B) cabinetry" }, { "from": "gpt", "value": "(A) clock" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898622_757633106359083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, toilet (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) toilet\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739902_15082073391291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, appliance (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018608_633232514482625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the table (highlighted by a red box)? studio couch (highlighted by a blue box) or couch (highlighted by a green box).\n(A) studio couch\n(B) couch" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261681_3608744764375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, picture frame (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) picture frame\n(B) cabinetry" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204670_12411144355250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, shelf (highlighted by a red box) or book (highlighted by a blue box)?\n(A) shelf\n(B) book" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204474_25057580975666_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446140_141007968848291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, paperback book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) paperback book\n(B) book" }, { "from": "gpt", "value": "(A) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334147_142757225488208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, cabinet (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) cabinet\n(B) picture frame" }, { "from": "gpt", "value": "(A) cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331684_6477096043041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from nightstand (highlighted by a red box)? Choose among these: chest of drawers (highlighted by a blue box) or window screen (highlighted by a green box).\n(A) chest of drawers\n(B) window screen" }, { "from": "gpt", "value": "(B) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115649_4928248845125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, picture frame (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) picture frame\n(B) pillow" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663313_76586278483791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, glass door (highlighted by a red box) or mirror (highlighted by a blue box)?\n(A) glass door\n(B) mirror" }, { "from": "gpt", "value": "(B) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332080_251462522070666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of toilet (annotated by the red box) in relation to curtain?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333122_115476898026375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, toilet paper (highlighted by a red box) or toilet (highlighted by a blue box)?\n(A) toilet paper\n(B) toilet" }, { "from": "gpt", "value": "(B) toilet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331491_153060015889083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, computer monitor (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) computer monitor\n(B) picture frame" }, { "from": "gpt", "value": "(A) computer monitor" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204836_452646246375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, cabinetry (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) cabinetry\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334729_535896133096499_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from music stool (highlighted by a red box)? Select from houseplant (highlighted by a blue box) and window sill (highlighted by a green box).\n(A) houseplant\n(B) window sill" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458231_78610002066041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to gas stove (highlighted by a red box), cupboard (highlighted by a blue box) or electric outlet (highlighted by a green box)?\n(A) cupboard\n(B) electric outlet" }, { "from": "gpt", "value": "(A) cupboard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649614_37032169696750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, light fixture (highlighted by a red box) or backdrop (highlighted by a blue box)?\n(A) light fixture\n(B) backdrop" }, { "from": "gpt", "value": "(B) backdrop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898587_184505773212208_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to chair (highlighted by a red box), chair (highlighted by a blue box) or table (highlighted by a green box)?\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430982_101724821194291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, doormat (highlighted by a red box) or plywood (highlighted by a blue box)?\n(A) doormat\n(B) plywood" }, { "from": "gpt", "value": "(B) plywood" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260892_8853997534875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, counter top (highlighted by a red box) or cleaning product (highlighted by a blue box)?\n(A) counter top\n(B) cleaning product" }, { "from": "gpt", "value": "(A) counter top" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358471_46571972470208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, television (highlighted by a red box) or remote control (highlighted by a blue box)?\n(A) television\n(B) remote control" }, { "from": "gpt", "value": "(A) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261332_24041128887041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from pillow (highlighted by a red box)? Choose among these: bed (highlighted by a blue box) or door (highlighted by a green box).\n(A) bed\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204852_1543524312000_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to shower (highlighted by a red box), shower (highlighted by a blue box) or shower (highlighted by a green box)?\n(A) shower\n(B) shower" }, { "from": "gpt", "value": "(A) shower" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334273_157201262132000_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from window screen (highlighted by a red box)? Choose from cabinetry (highlighted by a blue box) and screen door (highlighted by a green box).\n(A) cabinetry\n(B) screen door" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895192_38405224960000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, screen door (highlighted by a red box) or sink (highlighted by a blue box)?\n(A) screen door\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670356_67363487214541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, curtain (highlighted by a red box) or door (highlighted by a blue box)?\n(A) curtain\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430608_315205620819166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, square (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) square\n(B) furniture" }, { "from": "gpt", "value": "(A) square" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261358_25895521892833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, sink (highlighted by a red box) or countertop (highlighted by a blue box)?\n(A) sink\n(B) countertop" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895245_75690990957833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, paperback book (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) paperback book\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333319_28354541280833_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the cabinetry (highlighted by a red box)? appliance (highlighted by a blue box) or kitchen appliance (highlighted by a green box).\n(A) appliance\n(B) kitchen appliance" }, { "from": "gpt", "value": "(B) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899483_955269317748333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, air conditioning (highlighted by a red box) or home appliance (highlighted by a blue box)?\n(A) air conditioning\n(B) home appliance" }, { "from": "gpt", "value": "(B) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261556_75640875446000_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from cabinetry (highlighted by a red box)? Select from home appliance (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) home appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(A) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018760_15103451919958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chair (highlighted by a red box) or picnic basket (highlighted by a blue box)?\n(A) chair\n(B) picnic basket" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332195_263804840971081_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is laundry (annotated by the red box) located relative to pouch?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649393_11205703221833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from bookcase (highlighted by a red box)? Select from table (highlighted by a blue box) and tableware (highlighted by a green box).\n(A) table\n(B) tableware" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445716_63667906311625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of sink (annotated by the red box) and mouthwash in the image provided, where is sink (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446479_355570760249458_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the chair (highlighted by a red box)? bean bag chair (highlighted by a blue box) or clothing (highlighted by a green box).\n(A) bean bag chair\n(B) clothing" }, { "from": "gpt", "value": "(B) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898439_2661245468166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, door (highlighted by a red box) or clothing (highlighted by a blue box)?\n(A) door\n(B) clothing" }, { "from": "gpt", "value": "(B) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663322_77693663474375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, sink (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) sink\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669896_11114698886666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, coffee table (highlighted by a red box) or window screen (highlighted by a blue box)?\n(A) coffee table\n(B) window screen" }, { "from": "gpt", "value": "(A) coffee table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332653_369019075168166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of television (annotated by the red box) in reference to cabinetry? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739344_46028721665500_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899491_197838144753583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, chair (highlighted by a red box) or table (highlighted by a blue box)?\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899263_883253305430333_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018883_653726172049000_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331589_15949279724250_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from book (highlighted by a red box), bed (highlighted by a blue box) or toy (highlighted by a green box)?\n(A) bed\n(B) toy" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458640_128056381213791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, furniture (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) furniture\n(B) curtain" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018150_372925684426416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, table (highlighted by a red box) or piano (highlighted by a blue box)?\n(A) table\n(B) piano" }, { "from": "gpt", "value": "(B) piano" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897732_115055403561875_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332183_262770320641166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, shelf (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) shelf\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018600_632548599025250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, houseplant (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) houseplant\n(B) curtain" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334284_161095336822333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, screen door (highlighted by a red box) or window (highlighted by a blue box)?\n(A) screen door\n(B) window" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018757_14938951720750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, light switch (highlighted by a red box) or door (highlighted by a blue box)?\n(A) light switch\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828369_92353016428958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, studio couch (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662884_16529782825875_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to changing table (highlighted by a red box)? Select from furniture (highlighted by a blue box) and mat (highlighted by a green box).\n(A) furniture\n(B) mat" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897479_112550741831041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, counter top (highlighted by a red box) or mirror (highlighted by a blue box)?\n(A) counter top\n(B) mirror" }, { "from": "gpt", "value": "(A) counter top" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895459_130511011911083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of furniture (annotated by the red box) in reference to paper? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115165_88156284513375_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from screen door (highlighted by a red box)? radiator (highlighted by a blue box) or door (highlighted by a green box)?\n(A) radiator\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115394_3354860802333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of table (annotated by the red box) in reference to furniture?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662891_19497497983083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, stationary bicycle (highlighted by a red box) or glass door (highlighted by a blue box)?\n(A) stationary bicycle\n(B) glass door" }, { "from": "gpt", "value": "(A) stationary bicycle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446492_356625060383416_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from kitchen appliance (highlighted by a red box)? Choose among these: appliance (highlighted by a blue box) or bath towel (highlighted by a green box).\n(A) appliance\n(B) bath towel" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331177_277401901989458_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to door (highlighted by a red box)? Choose from armchair (highlighted by a blue box) and chair (highlighted by a green box).\n(A) armchair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649478_15083137376416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, lamp (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) lamp\n(B) radiator" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334961_667569284353750_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from book (highlighted by a red box), book (highlighted by a blue box) or book (highlighted by a green box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333268_21962314227166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, paper plate (highlighted by a red box) or platter (highlighted by a blue box)?\n(A) paper plate\n(B) platter" }, { "from": "gpt", "value": "(B) platter" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430978_101756924791541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from mirror (highlighted by a red box)? Select from screen door (highlighted by a blue box) and door (highlighted by a green box).\n(A) screen door\n(B) door" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333494_62245703875458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, window screen (highlighted by a red box) or window screen (highlighted by a blue box)?\n(A) window screen\n(B) window screen" }, { "from": "gpt", "value": "(A) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896188_141867419420500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from droplight (highlighted by a red box)? Select from window (highlighted by a blue box) and door (highlighted by a green box).\n(A) window\n(B) door" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334912_1089986468708375_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895679_370075952474500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, fridge (highlighted by a red box) or table (highlighted by a blue box)?\n(A) fridge\n(B) table" }, { "from": "gpt", "value": "(A) fridge" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828441_91474325564875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, table lamp (highlighted by a red box) or lighting (highlighted by a blue box)?\n(A) table lamp\n(B) lighting" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430931_92859385351125_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from person (highlighted by a red box)? lamp (highlighted by a blue box) or person (highlighted by a green box)?\n(A) lamp\n(B) person" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896365_19867845396791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from kitchen appliance (highlighted by a red box)? picnic table (highlighted by a blue box) or appliance (highlighted by a green box)?\n(A) picnic table\n(B) appliance" }, { "from": "gpt", "value": "(A) picnic table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663064_38456495992833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, electric outlet (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) electric outlet\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447287_408826596953875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, appliance (highlighted by a red box) or dresser (highlighted by a blue box)?\n(A) appliance\n(B) dresser" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334559_68604628585415_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from window (highlighted by a red box)? Choose among these: curtain (highlighted by a blue box) or houseplant (highlighted by a green box).\n(A) curtain\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48017829_696866873185416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from cardboard box (highlighted by a red box)? Choose from radiator (highlighted by a blue box) and bulletin board (highlighted by a green box).\n(A) radiator\n(B) bulletin board" }, { "from": "gpt", "value": "(B) bulletin board" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895593_1161484186474083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, cabinetry (highlighted by a red box) or plant (highlighted by a blue box)?\n(A) cabinetry\n(B) plant" }, { "from": "gpt", "value": "(B) plant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333031_59010826470416_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204341_14988900777416_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the basket (highlighted by a red box)? Choose among these: radiator (highlighted by a blue box) or screen door (highlighted by a green box).\n(A) radiator\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828476_100597047380208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, appliance (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) appliance\n(B) bottle" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331615_18081983911125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, curtain (highlighted by a red box) or window (highlighted by a blue box)?\n(A) curtain\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446485_355888347063791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from speaker (highlighted by a red box)? Choose from furniture (highlighted by a blue box) and animal (highlighted by a green box).\n(A) furniture\n(B) animal" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796752_29816755513916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, furniture (highlighted by a red box) or wheel (highlighted by a blue box)?\n(A) furniture\n(B) wheel" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331491_153078025231958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from picture frame (highlighted by a red box), television (highlighted by a blue box) or shelf (highlighted by a green box)?\n(A) television\n(B) shelf" }, { "from": "gpt", "value": "(A) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204387_23098485697208_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from computer monitor (highlighted by a red box)? printer (highlighted by a blue box) or door (highlighted by a green box)?\n(A) printer\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115118_84673835196708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from window (highlighted by a red box), cabinetry (highlighted by a blue box) or television (highlighted by a green box)?\n(A) cabinetry\n(B) television" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898729_583554568231291_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895826_1220011667431833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, bed (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) bed\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649643_40411130442416_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from toilet paper (highlighted by a red box)? Choose among these: basket (highlighted by a blue box) or window sill (highlighted by a green box).\n(A) basket\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458283_76329545358666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to pillow (highlighted by a red box)? pillow (highlighted by a blue box) or studio couch (highlighted by a green box).\n(A) pillow\n(B) studio couch" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332696_107028302999916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to window (highlighted by a red box)? lighting (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) lighting\n(B) picture frame" }, { "from": "gpt", "value": "(A) lighting" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358731_6711814014416_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from dresser (highlighted by a red box), furniture (highlighted by a blue box) or throw pillow (highlighted by a green box)?\n(A) furniture\n(B) throw pillow" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332046_208823932106333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from bath towel (highlighted by a red box)? tile (highlighted by a blue box) or bathtub (highlighted by a green box)?\n(A) tile\n(B) bathtub" }, { "from": "gpt", "value": "(A) tile" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739359_186949494610208_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from porcelain (highlighted by a red box)? Choose from toilet paper (highlighted by a blue box) and toilet paper (highlighted by a green box).\n(A) toilet paper\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42923207_1819199636583_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to brush (highlighted by a red box), desk (highlighted by a blue box) or swivel chair (highlighted by a green box)?\n(A) desk\n(B) swivel chair" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444758_80905955114583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from pillow (highlighted by a red box)? Choose among these: nightstand (highlighted by a blue box) or door (highlighted by a green box).\n(A) nightstand\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261219_13588819904625_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from bottle (highlighted by a red box)? Select from vent (highlighted by a blue box) and appliance (highlighted by a green box).\n(A) vent\n(B) appliance" }, { "from": "gpt", "value": "(A) vent" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261688_350441675541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, chair (highlighted by a red box) or paperback book (highlighted by a blue box)?\n(A) chair\n(B) paperback book" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334037_278592920507166_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from bookshelf (highlighted by a red box)? Choose among these: screen door (highlighted by a blue box) or door (highlighted by a green box).\n(A) screen door\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358698_3044725012125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chest of drawers (highlighted by a red box) or vase (highlighted by a blue box)?\n(A) chest of drawers\n(B) vase" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334515_64446265782333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, towel/napkin (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) towel/napkin\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333139_40058976361291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to computer monitor (highlighted by a red box)? Select from computer (highlighted by a blue box) and desk (highlighted by a green box).\n(A) computer\n(B) desk" }, { "from": "gpt", "value": "(B) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663064_38516488927166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, studio couch (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) studio couch\n(B) curtain" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332195_263840943030500_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from bottle (highlighted by a red box), bottle (highlighted by a blue box) or counter (highlighted by a green box)?\n(A) bottle\n(B) counter" }, { "from": "gpt", "value": "(B) counter" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796730_28597276082791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from picture frame (highlighted by a red box)? Select from studio couch (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739933_16693613510874_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, toilet bowl (highlighted by a red box) or soap (highlighted by a blue box)?\n(A) toilet bowl\n(B) soap" }, { "from": "gpt", "value": "(B) soap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897859_529538171886625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, list (highlighted by a red box) or handbag (highlighted by a blue box)?\n(A) list\n(B) handbag" }, { "from": "gpt", "value": "(B) handbag" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334756_421257808416041_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to countertop (highlighted by a red box)? bottle (highlighted by a blue box) or food (highlighted by a green box).\n(A) bottle\n(B) food" }, { "from": "gpt", "value": "(B) food" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204303_14983571830958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chair (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) chair\n(B) curtain" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331343_192413411139416_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to couch (highlighted by a red box)? Select from window (highlighted by a blue box) and window sill (highlighted by a green box).\n(A) window\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429717_18197233608583_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to bowl (highlighted by a red box), coffee maker (highlighted by a blue box) or power plugs and sockets (highlighted by a green box)?\n(A) coffee maker\n(B) power plugs and sockets" }, { "from": "gpt", "value": "(A) coffee maker" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204724_23494515531708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from couch (highlighted by a red box)? Select from chest of drawers (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) chest of drawers\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898984_824263394624041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the pillow (highlighted by a red box)? pillow (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897892_345138502537625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, flag (highlighted by a red box) or flag (highlighted by a blue box)?\n(A) flag\n(B) flag" }, { "from": "gpt", "value": "(B) flag" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444709_74167304785666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the path (highlighted by a red box)? concrete (highlighted by a blue box) or door (highlighted by a green box).\n(A) concrete\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828552_101522721297125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, chair (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) chair\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662912_19991754481500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chair (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) chair\n(B) pillow" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444735_77921096039041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to glass door (highlighted by a red box)? Choose from houseplant (highlighted by a blue box) and door (highlighted by a green box).\n(A) houseplant\n(B) door" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828390_94716597024708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, screen door (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) screen door\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331283_14120298124541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, shelf (highlighted by a red box) or cardboard box (highlighted by a blue box)?\n(A) shelf\n(B) cardboard box" }, { "from": "gpt", "value": "(B) cardboard box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358362_16327257705333_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears farthest from the camera in this image?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896527_34728925894333_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the bottle (highlighted by a red box)? bottle (highlighted by a blue box) or bottle (highlighted by a green box).\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458262_74193137964041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, tripod (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) tripod\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447275_408653601542958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the toy (highlighted by a red box)? toy (highlighted by a blue box) or toy (highlighted by a green box).\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(A) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458704_136676868476250_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332204_264233179729291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, toy (highlighted by a red box) or couch (highlighted by a blue box)?\n(A) toy\n(B) couch" }, { "from": "gpt", "value": "(B) couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115131_85661556921500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from mouthwash (highlighted by a red box)? Choose among these: cleaning product (highlighted by a blue box) or ledge (highlighted by a green box).\n(A) cleaning product\n(B) ledge" }, { "from": "gpt", "value": "(B) ledge" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333847_75016225683750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, picture frame (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) picture frame\n(B) shelf" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649804_46725095094916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to lamp (highlighted by a red box)? Select from picture frame (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261344_24361538668083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to door (highlighted by a red box)? Choose from chair (highlighted by a blue box) and door (highlighted by a green box).\n(A) chair\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261686_3839948934041_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the picture frame (highlighted by a red box)? lamp (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) lamp\n(B) picture frame" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896089_143928099662541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from chair (highlighted by a red box)? Choose among these: gas stove (highlighted by a blue box) or table (highlighted by a green box).\n(A) gas stove\n(B) table" }, { "from": "gpt", "value": "(A) gas stove" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896169_140673516548958_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, lamp (highlighted by a red box) or desk (highlighted by a blue box)?\n(A) lamp\n(B) desk" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331084_133972982302041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from door (highlighted by a red box)? Choose among these: door (highlighted by a blue box) or magazine (highlighted by a green box).\n(A) door\n(B) magazine" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018634_635972677203125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from studio couch (highlighted by a red box)? Choose from curtain (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) curtain\n(B) pillow" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332049_208997728374875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is window (annotated by the red box) located relative to infant bed? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895272_79414313214750_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the cabinetry (highlighted by a red box)? chair (highlighted by a blue box) or table (highlighted by a green box).\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331541_7061814638333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, teddy bear (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) teddy bear\n(B) pillow" }, { "from": "gpt", "value": "(A) teddy bear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796692_30746248978291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, footwear (highlighted by a red box) or shoe (highlighted by a blue box)?\n(A) footwear\n(B) shoe" }, { "from": "gpt", "value": "(B) shoe" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333325_29495821350291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to clothing (highlighted by a red box)? Choose from blanket (highlighted by a blue box) and swivel chair (highlighted by a green box).\n(A) blanket\n(B) swivel chair" }, { "from": "gpt", "value": "(B) swivel chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261281_14432549109708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from pillow (highlighted by a red box)? Select from picture frame (highlighted by a blue box) and table lamp (highlighted by a green box).\n(A) picture frame\n(B) table lamp" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895868_107592764631083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48017887_80070913636833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, rocking chair (highlighted by a red box) or armchair (highlighted by a blue box)?\n(A) rocking chair\n(B) armchair" }, { "from": "gpt", "value": "(B) armchair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018808_19401781523541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, chair (highlighted by a red box) or concrete (highlighted by a blue box)?\n(A) chair\n(B) concrete" }, { "from": "gpt", "value": "(B) concrete" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358118_62573396058791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, sink (highlighted by a red box) or tap (highlighted by a blue box)?\n(A) sink\n(B) tap" }, { "from": "gpt", "value": "(B) tap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739844_17139117957125_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to dresser (highlighted by a red box), mat (highlighted by a blue box) or studio couch (highlighted by a green box)?\n(A) mat\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261728_2866292848416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, bowl (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) bowl\n(B) cabinetry" }, { "from": "gpt", "value": "(A) bowl" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670075_38527517351333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, window (highlighted by a red box) or window (highlighted by a blue box)?\n(A) window\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429738_19889967562791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from footwear (highlighted by a red box)? footwear (highlighted by a blue box) or footwear (highlighted by a green box)?\n(A) footwear\n(B) footwear" }, { "from": "gpt", "value": "(B) footwear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331027_474601820225500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from mug (highlighted by a red box)? gas stove (highlighted by a blue box) or kitchen appliance (highlighted by a green box)?\n(A) gas stove\n(B) kitchen appliance" }, { "from": "gpt", "value": "(A) gas stove" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261601_52864894258041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333590_208835790341833_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, sink (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) sink\n(B) toiletry" }, { "from": "gpt", "value": "(B) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332079_251384920111541_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48017894_80938144834333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, cabinetry (highlighted by a red box) or bath mat (highlighted by a blue box)?\n(A) cabinetry\n(B) bath mat" }, { "from": "gpt", "value": "(B) bath mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828552_101504711755208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, step stool (highlighted by a red box) or step stool (highlighted by a blue box)?\n(A) step stool\n(B) step stool" }, { "from": "gpt", "value": "(A) step stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670149_40621637662250_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to bottle (highlighted by a red box)? Select from bottle (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) bottle\n(B) picture frame" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334672_391446105965166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, waste container (highlighted by a red box) or concrete (highlighted by a blue box)?\n(A) waste container\n(B) concrete" }, { "from": "gpt", "value": "(A) waste container" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895448_129443294287166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, towel (highlighted by a red box) or towel (highlighted by a blue box)?\n(A) towel\n(B) towel" }, { "from": "gpt", "value": "(A) towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430441_814248952750_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the kitchen appliance (highlighted by a red box)? grapefruit (highlighted by a blue box) or apple (highlighted by a green box).\n(A) grapefruit\n(B) apple" }, { "from": "gpt", "value": "(A) grapefruit" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261378_27078618976166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to stationary bicycle (highlighted by a red box), dumbbell (highlighted by a blue box) or window screen (highlighted by a green box)?\n(A) dumbbell\n(B) window screen" }, { "from": "gpt", "value": "(B) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897605_137307638256125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to curtain (highlighted by a red box), window (highlighted by a blue box) or window sill (highlighted by a green box)?\n(A) window\n(B) window sill" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204271_12680465876083_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the picture frame (highlighted by a red box)? Choose among these: window (highlighted by a blue box) or mirror (highlighted by a green box).\n(A) window\n(B) mirror" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897547_473220102463333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, furniture (highlighted by a red box) or blanket (highlighted by a blue box)?\n(A) furniture\n(B) blanket" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018846_649901719848208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, appliance (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897928_348904445454208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, countertop (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) countertop\n(B) bottle" }, { "from": "gpt", "value": "(A) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430713_335329216112500_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from chair (highlighted by a red box)? radiator (highlighted by a blue box) or doormat (highlighted by a green box)?\n(A) radiator\n(B) doormat" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358406_40713378848291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to gas stove (highlighted by a red box), bottle (highlighted by a blue box) or paper towel (highlighted by a green box)?\n(A) bottle\n(B) paper towel" }, { "from": "gpt", "value": "(B) paper towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445938_79460563299416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, shelf (highlighted by a red box) or door (highlighted by a blue box)?\n(A) shelf\n(B) door" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445677_61050018061791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to book (highlighted by a red box), book (highlighted by a blue box) or book (highlighted by a green box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115501_12499918556458_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to studio couch (highlighted by a red box)? table (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) table\n(B) pillow" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358617_552706739375_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to door (highlighted by a red box), mat (highlighted by a blue box) or boot (highlighted by a green box)?\n(A) mat\n(B) boot" }, { "from": "gpt", "value": "(B) boot" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898349_509483011939916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, bathtub (highlighted by a red box) or cleaning product (highlighted by a blue box)?\n(A) bathtub\n(B) cleaning product" }, { "from": "gpt", "value": "(B) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446608_210339297748041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, closet (highlighted by a red box) or closet (highlighted by a blue box)?\n(A) closet\n(B) closet" }, { "from": "gpt", "value": "(A) closet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204795_24271841443750_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to blanket (highlighted by a red box)? cabinetry (highlighted by a blue box) or bird cage (highlighted by a green box).\n(A) cabinetry\n(B) bird cage" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333125_115562396632875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, laundry (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) laundry\n(B) screen door" }, { "from": "gpt", "value": "(A) laundry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445720_59030880788333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the appliance (highlighted by a red box)? Choose among these: bottle (highlighted by a blue box) or basin (highlighted by a green box).\n(A) bottle\n(B) basin" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331793_10261092752125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, basket (highlighted by a red box) or square (highlighted by a blue box)?\n(A) basket\n(B) square" }, { "from": "gpt", "value": "(A) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429798_737372429790500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, table (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) table\n(B) radiator" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899935_863180980503791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, appliance (highlighted by a red box) or window (highlighted by a blue box)?\n(A) appliance\n(B) window" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334767_424049834356916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, soap dispenser (highlighted by a red box) or toothbrush (highlighted by a blue box)?\n(A) soap dispenser\n(B) toothbrush" }, { "from": "gpt", "value": "(A) soap dispenser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430294_187603952355250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, floral arrangement (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) floral arrangement\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333055_60308483164208_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to shelf (highlighted by a red box)? houseplant (highlighted by a blue box) or book (highlighted by a green box).\n(A) houseplant\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261263_13869304814500_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from counter top (highlighted by a red box), window sill (highlighted by a blue box) or toilet (highlighted by a green box)?\n(A) window sill\n(B) toilet" }, { "from": "gpt", "value": "(A) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115362_834062926041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to curtain (highlighted by a red box)? pillow (highlighted by a blue box) or studio couch (highlighted by a green box).\n(A) pillow\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358167_60825933161916_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895199_39486122413250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, studio couch (highlighted by a red box) or blanket (highlighted by a blue box)?\n(A) studio couch\n(B) blanket" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334935_663048898909833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, door (highlighted by a red box) or kitchen appliance (highlighted by a blue box)?\n(A) door\n(B) kitchen appliance" }, { "from": "gpt", "value": "(B) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332396_401302808500666_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, curtain (highlighted by a red box) or window (highlighted by a blue box)?\n(A) curtain\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895493_450859870852083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from book (highlighted by a red box)? Choose among these: houseplant (highlighted by a blue box) or book (highlighted by a green box).\n(A) houseplant\n(B) book" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895917_111337841060583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to table (highlighted by a red box)? Select from wine bottle (highlighted by a blue box) and mouthwash (highlighted by a green box).\n(A) wine bottle\n(B) mouthwash" }, { "from": "gpt", "value": "(B) mouthwash" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899640_231838093057291_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331144_179481294150750_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from desk (highlighted by a red box)? chair (highlighted by a blue box) or book (highlighted by a green box)?\n(A) chair\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895571_1153716442672208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649727_49005304386125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, mirror (highlighted by a red box) or window sill (highlighted by a blue box)?\n(A) mirror\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895911_111486845851208_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331938_164863025932958_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, bed (highlighted by a red box) or cloth (highlighted by a blue box)?\n(A) bed\n(B) cloth" }, { "from": "gpt", "value": "(B) cloth" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115358_4287807243915_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from bedding (highlighted by a red box)? Choose among these: pillow (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739281_42576764219291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, desk (highlighted by a red box) or laptop (highlighted by a blue box)?\n(A) desk\n(B) laptop" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333298_26658434543583_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from houseplant (highlighted by a red box)? Select from cleaning product (highlighted by a blue box) and toilet paper (highlighted by a green box).\n(A) cleaning product\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430694_327495285609708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, bathtub (highlighted by a red box) or ceramic tile (highlighted by a blue box)?\n(A) bathtub\n(B) ceramic tile" }, { "from": "gpt", "value": "(B) ceramic tile" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333249_33627818257125_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898334_506650977699458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is pillow (annotated by the red box) located relative to pillow? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334052_85568540439666_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to beach towel (highlighted by a red box)? Select from microwave oven (highlighted by a blue box) and beach towel (highlighted by a green box).\n(A) microwave oven\n(B) beach towel" }, { "from": "gpt", "value": "(B) beach towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458561_128021217722875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, screen door (highlighted by a red box) or doormat (highlighted by a blue box)?\n(A) screen door\n(B) doormat" }, { "from": "gpt", "value": "(B) doormat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445168_7988531316500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to window (highlighted by a red box)? curtain (highlighted by a blue box) or light fixture (highlighted by a green box).\n(A) curtain\n(B) light fixture" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649612_36508417991458_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the dresser (highlighted by a red box)? table lamp (highlighted by a blue box) or nightstand (highlighted by a green box).\n(A) table lamp\n(B) nightstand" }, { "from": "gpt", "value": "(B) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896515_33540771053500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, platter (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) platter\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895910_110942543721625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, table lamp (highlighted by a red box) or tripod (highlighted by a blue box)?\n(A) table lamp\n(B) tripod" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204289_14380396245083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to appliance (highlighted by a red box), clock (highlighted by a blue box) or cabinetry (highlighted by a green box)?\n(A) clock\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331002_178703932109291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, door (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) door\n(B) cabinetry" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828369_92300921315208_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from table (highlighted by a red box)? Choose among these: doormat (highlighted by a blue box) or fireplace (highlighted by a green box).\n(A) doormat\n(B) fireplace" }, { "from": "gpt", "value": "(A) doormat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115143_87152978008875_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to cabinetry (highlighted by a red box)? Select from kitchen appliance (highlighted by a blue box) and electric outlet (highlighted by a green box).\n(A) kitchen appliance\n(B) electric outlet" }, { "from": "gpt", "value": "(A) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896589_32979538374000_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from washing machine (highlighted by a red box), washing machine (highlighted by a blue box) or basket (highlighted by a green box)?\n(A) washing machine\n(B) basket" }, { "from": "gpt", "value": "(B) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333618_76343631860375_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to picture frame (highlighted by a red box)? Select from animal (highlighted by a blue box) and animal (highlighted by a green box).\n(A) animal\n(B) animal" }, { "from": "gpt", "value": "(B) animal" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333308_28025342059166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, microwave oven (highlighted by a red box) or coffee cup (highlighted by a blue box)?\n(A) microwave oven\n(B) coffee cup" }, { "from": "gpt", "value": "(A) microwave oven" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739313_44828006947333_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, table (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) table\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261695_607756601916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, chair (highlighted by a red box) or window screen (highlighted by a blue box)?\n(A) chair\n(B) window screen" }, { "from": "gpt", "value": "(B) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663347_91344111473875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897418_103528288762500_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from shelf (highlighted by a red box), shower door (highlighted by a blue box) or bath (highlighted by a green box)?\n(A) shower door\n(B) bath" }, { "from": "gpt", "value": "(A) shower door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739965_18661770503833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, television (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) television\n(B) toy" }, { "from": "gpt", "value": "(A) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796745_28716079069458_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, piano (highlighted by a red box) or power outlet (highlighted by a blue box)?\n(A) piano\n(B) power outlet" }, { "from": "gpt", "value": "(B) power outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458330_102993718532208_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from sink (highlighted by a red box)? appliance (highlighted by a blue box) or bottle (highlighted by a green box)?\n(A) appliance\n(B) bottle" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334499_63930051356166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, cabinetry (highlighted by a red box) or kitchen appliance (highlighted by a blue box)?\n(A) cabinetry\n(B) kitchen appliance" }, { "from": "gpt", "value": "(B) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358406_40695369639916_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the countertop (highlighted by a red box)? Choose among these: notepad (highlighted by a blue box) or door (highlighted by a green box).\n(A) notepad\n(B) door" }, { "from": "gpt", "value": "(A) notepad" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429833_748655336857125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, box (highlighted by a red box) or box (highlighted by a blue box)?\n(A) box\n(B) box" }, { "from": "gpt", "value": "(B) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018286_799423421532875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, desk (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) desk\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458675_9305689027125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, extension cord (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) extension cord\n(B) radiator" }, { "from": "gpt", "value": "(A) extension cord" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261219_13528811480666_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, exhaust hood (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) exhaust hood\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895287_80080851869708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, teddy (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) teddy\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334934_663209600413041_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from chair (highlighted by a red box)? Choose among these: plant (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) plant\n(B) cabinetry" }, { "from": "gpt", "value": "(A) plant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331921_631010191847250_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to flowerpot (highlighted by a red box)? Choose from flowerpot (highlighted by a blue box) and houseplant (highlighted by a green box).\n(A) flowerpot\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662908_20113753854500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, television (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) television\n(B) pillow" }, { "from": "gpt", "value": "(A) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828231_69996219037125_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to computer monitor (highlighted by a red box), window (highlighted by a blue box) or table lamp (highlighted by a green box)?\n(A) window\n(B) table lamp" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48017893_80847748091750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, countertop (highlighted by a red box) or food (highlighted by a blue box)?\n(A) countertop\n(B) food" }, { "from": "gpt", "value": "(B) food" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430928_92976171144708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, bed (highlighted by a red box) or dresser (highlighted by a blue box)?\n(A) bed\n(B) dresser" }, { "from": "gpt", "value": "(B) dresser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204786_27373568423250_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332469_886509269420083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, door (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) door\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899031_643142319980666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from christmas decoration (highlighted by a red box)? screen door (highlighted by a blue box) or christmas tree (highlighted by a green box)?\n(A) screen door\n(B) christmas tree" }, { "from": "gpt", "value": "(B) christmas tree" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899640_231861083913291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is cupboard (annotated by the red box) located in relation to cupboard in the image? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895978_134657508916083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, toilet (highlighted by a red box) or mouthwash (highlighted by a blue box)?\n(A) toilet\n(B) mouthwash" }, { "from": "gpt", "value": "(B) mouthwash" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662884_16533781244708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458633_127536276490708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from basket (highlighted by a red box)? Choose from furniture (highlighted by a blue box) and footwear (highlighted by a green box).\n(A) furniture\n(B) footwear" }, { "from": "gpt", "value": "(B) footwear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358729_6590628685458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, picture frame (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) picture frame\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897713_111876401354916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, cabinetry (highlighted by a red box) or material (highlighted by a blue box)?\n(A) cabinetry\n(B) material" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895871_489430472575875_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796446_633720852875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, lighting (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) lighting\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018832_649340750676083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, keyboard (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) keyboard\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828442_91428227170333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, studio couch (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) studio couch\n(B) chair" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445794_64762344206166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, window sill (highlighted by a red box) or trash bin/can (highlighted by a blue box)?\n(A) window sill\n(B) trash bin/can" }, { "from": "gpt", "value": "(B) trash bin/can" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115118_84732544243125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, cabinetry (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) cabinetry\n(B) basket" }, { "from": "gpt", "value": "(B) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796475_4308722876125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, chair (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) chair\n(B) studio couch" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446479_355586753721208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, coffee table (highlighted by a red box) or notepad (highlighted by a blue box)?\n(A) coffee table\n(B) notepad" }, { "from": "gpt", "value": "(B) notepad" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333292_26367537732041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, houseplant (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) houseplant\n(B) bottle" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333624_77098070274291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to plant (highlighted by a red box), chair (highlighted by a blue box) or window screen (highlighted by a green box)?\n(A) chair\n(B) window screen" }, { "from": "gpt", "value": "(B) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018838_649243456783291_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from cupboard (highlighted by a red box)? Select from curtain (highlighted by a blue box) and window screen (highlighted by a green box).\n(A) curtain\n(B) window screen" }, { "from": "gpt", "value": "(B) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332184_262568818937833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, shelf (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) shelf\n(B) shelf" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333031_58965328269958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, equipment (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) equipment\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333264_21841813301291_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to window (highlighted by a red box)? Choose from tableware (highlighted by a blue box) and table (highlighted by a green box).\n(A) tableware\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332778_44611052466916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, window frame (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) window frame\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899003_640663422572166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, cupboard (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) cupboard\n(B) mat" }, { "from": "gpt", "value": "(A) cupboard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331934_163631992726833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, bottle (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430269_185547619033625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of electric outlet (annotated by the red box) and door in the image provided, where is electric outlet (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898506_160897587644333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, nightstand (highlighted by a red box) or storage box (highlighted by a blue box)?\n(A) nightstand\n(B) storage box" }, { "from": "gpt", "value": "(B) storage box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458437_117575493796708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to gas stove (highlighted by a red box)? Select from appliance (highlighted by a blue box) and bath towel (highlighted by a green box).\n(A) appliance\n(B) bath towel" }, { "from": "gpt", "value": "(B) bath towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332563_905870837163541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, door (highlighted by a red box) or door (highlighted by a blue box)?\n(A) door\n(B) door" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333653_126316715935458_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is furniture (annotated by the red box) located in relation to door in the image? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670109_41035815490291_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the vanity (highlighted by a red box)? glass door (highlighted by a blue box) or table (highlighted by a green box).\n(A) glass door\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899474_954137621152166_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828150_73401402051500_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is cabinetry (annotated by the red box) located relative to cupboard? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445584_283393576933916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, door (highlighted by a red box) or postcard (highlighted by a blue box)?\n(A) door\n(B) postcard" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896089_143890098718708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the window sill (highlighted by a red box)? Choose among these: window screen (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) window screen\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334185_354538267914083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from kitchen appliance (highlighted by a red box)? kitchen appliance (highlighted by a blue box) or kitchen appliance (highlighted by a green box)?\n(A) kitchen appliance\n(B) kitchen appliance" }, { "from": "gpt", "value": "(B) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115201_94428142615958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, table lamp (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) table lamp\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446450_354695028277333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from shelf (highlighted by a red box)? desk (highlighted by a blue box) or cabinetry (highlighted by a green box)?\n(A) desk\n(B) cabinetry" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898681_576419180862125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, toilet paper (highlighted by a red box) or towel (highlighted by a blue box)?\n(A) toilet paper\n(B) towel" }, { "from": "gpt", "value": "(B) towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899955_865584556947583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, dresser (highlighted by a red box) or table (highlighted by a blue box)?\n(A) dresser\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332083_251916478417125_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669980_28865287745625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to table (highlighted by a red box)? picture frame (highlighted by a blue box) or swivel chair (highlighted by a green box).\n(A) picture frame\n(B) swivel chair" }, { "from": "gpt", "value": "(B) swivel chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334917_1090074366633707_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to oven (highlighted by a red box), cabinetry (highlighted by a blue box) or robe (highlighted by a green box)?\n(A) cabinetry\n(B) robe" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331421_544115131493457_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from chair (highlighted by a red box), table top (highlighted by a blue box) or laptop (highlighted by a green box)?\n(A) table top\n(B) laptop" }, { "from": "gpt", "value": "(B) laptop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332751_42613714094875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, houseplant (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) houseplant\n(B) appliance" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018704_545502569478665_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, countertop (highlighted by a red box) or window (highlighted by a blue box)?\n(A) countertop\n(B) window" }, { "from": "gpt", "value": "(A) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897722_114306641747041_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663363_91198702332958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to lamp (highlighted by a red box)? Choose from table (highlighted by a blue box) and concrete (highlighted by a green box).\n(A) table\n(B) concrete" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204820_28625219803166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of mirror (annotated by the red box) and bedding in the image provided, where is mirror (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333040_59752249930416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the table (highlighted by a red box)? bottle (highlighted by a blue box) or chair (highlighted by a green box).\n(A) bottle\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430854_74242490006666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the bean bag chair (highlighted by a red box)? mirror (highlighted by a blue box) or table (highlighted by a green box).\n(A) mirror\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332939_19422769120750_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897954_533749623582958_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, bottle (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898899_816878739064583_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, paper plate (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) paper plate\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898621_758006202955208_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from cleaning product (highlighted by a red box)? Choose from cleaning product (highlighted by a blue box) and cleaning product (highlighted by a green box).\n(A) cleaning product\n(B) cleaning product" }, { "from": "gpt", "value": "(A) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897409_102977183281083_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from appliance (highlighted by a red box)? Select from appliance (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332316_390881069646083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, cabinetry (highlighted by a red box) or home appliance (highlighted by a blue box)?\n(A) cabinetry\n(B) home appliance" }, { "from": "gpt", "value": "(B) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895863_107876163923208_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from chair (highlighted by a red box)? dog (highlighted by a blue box) or coffee table (highlighted by a green box)?\n(A) dog\n(B) coffee table" }, { "from": "gpt", "value": "(A) dog" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898057_223615645475041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to bathtub (highlighted by a red box)? Select from garbage (highlighted by a blue box) and door (highlighted by a green box).\n(A) garbage\n(B) door" }, { "from": "gpt", "value": "(A) garbage" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331934_163512691087875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, laptop (highlighted by a red box) or table (highlighted by a blue box)?\n(A) laptop\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204493_26370431288541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from screen door (highlighted by a red box), toilet paper (highlighted by a blue box) or bathtub (highlighted by a green box)?\n(A) toilet paper\n(B) bathtub" }, { "from": "gpt", "value": "(A) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662805_13535980270625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, star (highlighted by a red box) or table (highlighted by a blue box)?\n(A) star\n(B) table" }, { "from": "gpt", "value": "(A) star" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332759_43362224370541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, cleaning product (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) cleaning product\n(B) toiletry" }, { "from": "gpt", "value": "(A) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261515_43712337354166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, window (highlighted by a red box) or droplight (highlighted by a blue box)?\n(A) window\n(B) droplight" }, { "from": "gpt", "value": "(B) droplight" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261294_16238842218000_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from chest of drawers (highlighted by a red box)? window (highlighted by a blue box) or television (highlighted by a green box)?\n(A) window\n(B) television" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896043_130147040261708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from lighting (highlighted by a red box)? Choose among these: door (highlighted by a blue box) or door (highlighted by a green box).\n(A) door\n(B) door" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895298_90989131360416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, furniture (highlighted by a red box) or counter top (highlighted by a blue box)?\n(A) furniture\n(B) counter top" }, { "from": "gpt", "value": "(B) counter top" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334713_533802581754333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, book (highlighted by a red box) or file cabinet (highlighted by a blue box)?\n(A) book\n(B) file cabinet" }, { "from": "gpt", "value": "(B) file cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896160_139930081516875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, sink (highlighted by a red box) or toothpaste (highlighted by a blue box)?\n(A) sink\n(B) toothpaste" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898720_582961570847416_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from door (highlighted by a red box)? Select from screen door (highlighted by a blue box) and mirror (highlighted by a green box).\n(A) screen door\n(B) mirror" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204474_25111576182041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, paperback book (highlighted by a red box) or clock (highlighted by a blue box)?\n(A) paperback book\n(B) clock" }, { "from": "gpt", "value": "(A) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334628_386168631914083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, jacuzzi (highlighted by a red box) or towel (highlighted by a blue box)?\n(A) jacuzzi\n(B) towel" }, { "from": "gpt", "value": "(B) towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332991_125373693658250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, bean bag chair (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) bean bag chair\n(B) furniture" }, { "from": "gpt", "value": "(A) bean bag chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333031_58981138521333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, magazine (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) magazine\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331495_153700415207541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from hole (highlighted by a red box)? medicine cabinet (highlighted by a blue box) or shower door (highlighted by a green box)?\n(A) medicine cabinet\n(B) shower door" }, { "from": "gpt", "value": "(A) medicine cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670183_43201067207916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, sink (highlighted by a red box) or shower curtain (highlighted by a blue box)?\n(A) sink\n(B) shower curtain" }, { "from": "gpt", "value": "(B) shower curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333056_60195595614291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from armoire (highlighted by a red box), electric outlet (highlighted by a blue box) or nightstand (highlighted by a green box)?\n(A) electric outlet\n(B) nightstand" }, { "from": "gpt", "value": "(A) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796745_28691871986083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to electric outlet (highlighted by a red box)? Select from bath (highlighted by a blue box) and electric outlet (highlighted by a green box).\n(A) bath\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445599_285049831311166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, cupboard (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) cupboard\n(B) curtain" }, { "from": "gpt", "value": "(A) cupboard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669927_14198959735791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, drawer (highlighted by a red box) or drawer (highlighted by a blue box)?\n(A) drawer\n(B) drawer" }, { "from": "gpt", "value": "(A) drawer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896379_20398436292791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, light switch (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) light switch\n(B) radiator" }, { "from": "gpt", "value": "(A) light switch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332398_401507408707291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chair (highlighted by a red box) or book (highlighted by a blue box)?\n(A) chair\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898506_160756196332291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, door (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) door\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828506_102428770219291_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to chair (highlighted by a red box)? fireplace (highlighted by a blue box) or fireplace (highlighted by a green box).\n(A) fireplace\n(B) fireplace" }, { "from": "gpt", "value": "(B) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663064_38506492882791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, screen door (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) screen door\n(B) screen door" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828439_90629934747458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, coffeepot (highlighted by a red box) or tableware (highlighted by a blue box)?\n(A) coffeepot\n(B) tableware" }, { "from": "gpt", "value": "(B) tableware" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018915_553471124792166_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332204_264162574990750_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, curtain (highlighted by a red box) or animal (highlighted by a blue box)?\n(A) curtain\n(B) animal" }, { "from": "gpt", "value": "(B) animal" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897675_148505513091458_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to concrete (highlighted by a red box)? Select from bed (highlighted by a blue box) and door (highlighted by a green box).\n(A) bed\n(B) door" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895250_75610990334875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to bed (highlighted by a red box)? Choose from radiator (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) radiator\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670358_67310291612125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, screen (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) screen\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896512_33408275941708_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from table lamp (highlighted by a red box), pillow (highlighted by a blue box) or material (highlighted by a green box)?\n(A) pillow\n(B) material" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739305_43531970486958_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to kitchen appliance (highlighted by a red box), food (highlighted by a blue box) or faucet (highlighted by a green box)?\n(A) food\n(B) faucet" }, { "from": "gpt", "value": "(A) food" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429723_17926643670416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, paper towel (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) paper towel\n(B) appliance" }, { "from": "gpt", "value": "(A) paper towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899030_643007077162833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, chair (highlighted by a red box) or fabric (highlighted by a blue box)?\n(A) chair\n(B) fabric" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115118_84659840987416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, chair (highlighted by a red box) or floral arrangement (highlighted by a blue box)?\n(A) chair\n(B) floral arrangement" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895796_680677395279250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430978_101929121246166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, pillow (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) pillow\n(B) furniture" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332954_21999990382583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to home appliance (highlighted by a red box)? wok (highlighted by a blue box) or kitchen appliance (highlighted by a green box).\n(A) wok\n(B) kitchen appliance" }, { "from": "gpt", "value": "(A) wok" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662870_14528376297125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the shower curtain (highlighted by a red box)? plain (highlighted by a blue box) or toiletry (highlighted by a green box).\n(A) plain\n(B) toiletry" }, { "from": "gpt", "value": "(A) plain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897709_111982307278500_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from exhaust hood (highlighted by a red box), oven (highlighted by a blue box) or cabinetry (highlighted by a green box)?\n(A) oven\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446588_206017146240166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, houseplant (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) houseplant\n(B) pillow" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204877_3573028446291_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from door (highlighted by a red box)? Select from sink (highlighted by a blue box) and tile (highlighted by a green box).\n(A) sink\n(B) tile" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430217_180289201088291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, home appliance (highlighted by a red box) or desk (highlighted by a blue box)?\n(A) home appliance\n(B) desk" }, { "from": "gpt", "value": "(B) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896354_18689101078250_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the studio couch (highlighted by a red box)? Choose among these: studio couch (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261666_2572947948125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the bidet (highlighted by a red box)? bottle (highlighted by a blue box) or cleaning product (highlighted by a green box).\n(A) bottle\n(B) cleaning product" }, { "from": "gpt", "value": "(B) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663007_32290117007750_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the picture frame (highlighted by a red box)? Choose among these: table lamp (highlighted by a blue box) or window (highlighted by a green box).\n(A) table lamp\n(B) window" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430935_95022330156458_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, ceramic tile (highlighted by a red box) or tap (highlighted by a blue box)?\n(A) ceramic tile\n(B) tap" }, { "from": "gpt", "value": "(B) tap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739351_186514617958083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from table (highlighted by a red box)? Choose from door (highlighted by a blue box) and door (highlighted by a green box).\n(A) door\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358426_41427570693500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, toilet (highlighted by a red box) or bath mat (highlighted by a blue box)?\n(A) toilet\n(B) bath mat" }, { "from": "gpt", "value": "(B) bath mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896426_19190739179958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, lamp (highlighted by a red box) or door (highlighted by a blue box)?\n(A) lamp\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897547_473252089295291_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from cabinetry (highlighted by a red box)? Choose from clothing (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) clothing\n(B) cabinetry" }, { "from": "gpt", "value": "(A) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115195_105684060935083_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to box (highlighted by a red box)? box (highlighted by a blue box) or box (highlighted by a green box).\n(A) box\n(B) box" }, { "from": "gpt", "value": "(B) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899630_229917273928750_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from mirror (highlighted by a red box)? Select from studio couch (highlighted by a blue box) and radiator (highlighted by a green box).\n(A) studio couch\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444716_75607171951416_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115127_84836934383708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from table lamp (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and round table (highlighted by a green box).\n(A) picture frame\n(B) round table" }, { "from": "gpt", "value": "(B) round table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649720_47952943172833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhere is chair (annotated by the red box) located in relation to chair in the image?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898059_223716138261208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, glass door (highlighted by a red box) or door (highlighted by a blue box)?\n(A) glass door\n(B) door" }, { "from": "gpt", "value": "(A) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897478_112755144277750_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, nightstand (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) nightstand\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796684_30811138639750_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from door (highlighted by a red box)? Choose from appliance (highlighted by a blue box) and door (highlighted by a green box).\n(A) appliance\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115352_4025016462333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of furniture (annotated by the red box) and cupboard in the image provided, where is furniture (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896101_145177202106750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, studio couch (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261569_76313323773416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, table lamp (highlighted by a red box) or headboard (highlighted by a blue box)?\n(A) table lamp\n(B) headboard" }, { "from": "gpt", "value": "(B) headboard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333274_24130613090791_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the paperback book (highlighted by a red box)? shelf (highlighted by a blue box) or houseplant (highlighted by a green box).\n(A) shelf\n(B) houseplant" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430294_187656447716000_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from book (highlighted by a red box)? book (highlighted by a blue box) or book (highlighted by a green box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430401_126669800797916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, cabinetry (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) cabinetry\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898808_68981002473666_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, mirror (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) mirror\n(B) screen door" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334207_103269805716166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, shelf (highlighted by a red box) or vase (highlighted by a blue box)?\n(A) shelf\n(B) vase" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899120_129702065629750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, television (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) television\n(B) radiator" }, { "from": "gpt", "value": "(A) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332398_401535413966833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from glass door (highlighted by a red box)? Choose from studio couch (highlighted by a blue box) and glass door (highlighted by a green box).\n(A) studio couch\n(B) glass door" }, { "from": "gpt", "value": "(B) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429728_19154031901166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is furniture (annotated by the red box) located in relation to silver in the image? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828272_84484786285541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, doormat (highlighted by a red box) or doormat (highlighted by a blue box)?\n(A) doormat\n(B) doormat" }, { "from": "gpt", "value": "(A) doormat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739799_14850658128708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, home appliance (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) home appliance\n(B) appliance" }, { "from": "gpt", "value": "(A) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332808_47981329904833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to electric outlet (highlighted by a red box)? Select from cardboard box (highlighted by a blue box) and table (highlighted by a green box).\n(A) cardboard box\n(B) table" }, { "from": "gpt", "value": "(A) cardboard box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897971_216907370945916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the cabinetry (highlighted by a red box)? washing machine (highlighted by a blue box) or sink (highlighted by a green box).\n(A) washing machine\n(B) sink" }, { "from": "gpt", "value": "(A) washing machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898530_181152752460416_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from appliance (highlighted by a red box)? Choose among these: appliance (highlighted by a blue box) or tap (highlighted by a green box).\n(A) appliance\n(B) tap" }, { "from": "gpt", "value": "(B) tap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897462_470064056013583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the table (highlighted by a red box)? Choose among these: mirror (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) mirror\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331512_155312218945541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, toy (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331684_6442093581750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, chest of drawers (highlighted by a red box) or cardboard box (highlighted by a blue box)?\n(A) chest of drawers\n(B) cardboard box" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446485_355866356066833_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358289_15867054077041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649426_10815406561250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, bottle (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) bottle\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334539_66455792271707_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from pillow (highlighted by a red box)? Choose from book (highlighted by a blue box) and table (highlighted by a green box).\n(A) book\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333778_48277638471583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, box (highlighted by a red box) or box (highlighted by a blue box)?\n(A) box\n(B) box" }, { "from": "gpt", "value": "(A) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331211_281184252574541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to window sill (highlighted by a red box)? radiator (highlighted by a blue box) or chair (highlighted by a green box).\n(A) radiator\n(B) chair" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358360_16015065177166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, studio couch (highlighted by a red box) or picnic basket (highlighted by a blue box)?\n(A) studio couch\n(B) picnic basket" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895593_1161490184046166_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to dresser (highlighted by a red box)? Choose from houseplant (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) houseplant\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669978_28834300597791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of lamp (annotated by the red box) in relation to pattern?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796562_16000472735166_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from picture frame (highlighted by a red box)? Select from fireplace (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) fireplace\n(B) picture frame" }, { "from": "gpt", "value": "(A) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115238_97770871295125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, stairwell (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) stairwell\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899353_715991473655000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, bath towel (highlighted by a red box) or glass door (highlighted by a blue box)?\n(A) bath towel\n(B) glass door" }, { "from": "gpt", "value": "(B) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828272_84512791352708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is chair (annotated by the red box) located relative to washing machine? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430862_74307896903500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is window (annotated by the red box) located relative to curtain?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896416_17787030610250_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from table lamp (highlighted by a red box)? Choose from pillow (highlighted by a blue box) and changing table (highlighted by a green box).\n(A) pillow\n(B) changing table" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458730_138403217732124_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to tap (highlighted by a red box)? Select from bathroom cabinet (highlighted by a blue box) and cleaning product (highlighted by a green box).\n(A) bathroom cabinet\n(B) cleaning product" }, { "from": "gpt", "value": "(B) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895591_1161424577257458_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, microwave oven (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) microwave oven\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358673_873089251041_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to table (highlighted by a red box), kitchen appliance (highlighted by a blue box) or cabinetry (highlighted by a green box)?\n(A) kitchen appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444751_79707873141208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, electric outlet (highlighted by a red box) or doormat (highlighted by a blue box)?\n(A) electric outlet\n(B) doormat" }, { "from": "gpt", "value": "(A) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899364_717560296335208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, sink (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) sink\n(B) screen door" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445599_285061826371875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is chest of drawers (annotated by the red box) located in relation to curtain in the image? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018833_649163955637458_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, appliance (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896075_132621612911333_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the picture frame (highlighted by a red box)? stuff (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) stuff\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261292_16324741602791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to bed (highlighted by a red box)? Choose from pillow (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) pillow\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333003_128369003257166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, cabinet (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) cabinet\n(B) toiletry" }, { "from": "gpt", "value": "(A) cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897605_137325630981541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, chest of drawers (highlighted by a red box) or corridor (highlighted by a blue box)?\n(A) chest of drawers\n(B) corridor" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739455_51650394468041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the curtain (highlighted by a red box)? Choose among these: swivel chair (highlighted by a blue box) or window (highlighted by a green box).\n(A) swivel chair\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204271_12684464220958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to toilet (highlighted by a red box)? Choose from toiletry (highlighted by a blue box) and basket (highlighted by a green box).\n(A) toiletry\n(B) basket" }, { "from": "gpt", "value": "(B) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828437_90422050792708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from cabinetry (highlighted by a red box)? oven (highlighted by a blue box) or home appliance (highlighted by a green box)?\n(A) oven\n(B) home appliance" }, { "from": "gpt", "value": "(B) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204342_14923709890041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, lamp (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) lamp\n(B) picture frame" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333058_60962460996291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the mouthwash (highlighted by a red box)? Choose among these: mouthwash (highlighted by a blue box) or cleaning product (highlighted by a green box).\n(A) mouthwash\n(B) cleaning product" }, { "from": "gpt", "value": "(A) mouthwash" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669959_27850900228500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, window sill (highlighted by a red box) or soap (highlighted by a blue box)?\n(A) window sill\n(B) soap" }, { "from": "gpt", "value": "(A) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649787_45898405496125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, stool (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) stool\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429799_737880525148958_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444767_81440880847958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to curtain (highlighted by a red box), pillow (highlighted by a blue box) or canopy bed (highlighted by a green box)?\n(A) pillow\n(B) canopy bed" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331220_282459904149916_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from countertop (highlighted by a red box)? cabinetry (highlighted by a blue box) or appliance (highlighted by a green box)?\n(A) cabinetry\n(B) appliance" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331804_227799979411291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the lamp (highlighted by a red box)? Choose among these: cabinetry (highlighted by a blue box) or glass bowl (highlighted by a green box).\n(A) cabinetry\n(B) glass bowl" }, { "from": "gpt", "value": "(B) glass bowl" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430948_96233755742583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, wok (highlighted by a red box) or ceramic tile (highlighted by a blue box)?\n(A) wok\n(B) ceramic tile" }, { "from": "gpt", "value": "(A) wok" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332505_343952874108291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, studio couch (highlighted by a red box) or desk (highlighted by a blue box)?\n(A) studio couch\n(B) desk" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458626_127648282144250_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from studio couch (highlighted by a red box)? basket (highlighted by a blue box) or desk (highlighted by a green box)?\n(A) basket\n(B) desk" }, { "from": "gpt", "value": "(A) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332083_251878677104291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, window sill (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) window sill\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897631_139520453489125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, door (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) door\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445173_8195932159333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, appliance (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458582_1538381352250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, sink (highlighted by a red box) or sink (highlighted by a blue box)?\n(A) sink\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828391_94853690275791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, bed (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) bed\n(B) pillow" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828270_84277288813166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, door (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) door\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446057_79887969679333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, furniture (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) furniture\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261344_24359539460125_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115394_3423267071083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, table (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) table\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662905_20074153638291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from headboard (highlighted by a red box)? Select from curtain (highlighted by a blue box) and bedside lamp (highlighted by a green box).\n(A) curtain\n(B) bedside lamp" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649802_46903291233500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662809_13633989441791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from light fixture (highlighted by a red box)? picture frame (highlighted by a blue box) or curtain (highlighted by a green box)?\n(A) picture frame\n(B) curtain" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796579_16804166235333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, picture frame (highlighted by a red box) or fireplace (highlighted by a blue box)?\n(A) picture frame\n(B) fireplace" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739455_51634401094958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, table (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) table\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331542_6882920183625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, stool (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) stool\n(B) houseplant" }, { "from": "gpt", "value": "(A) stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670171_42353211324500_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to curtain (highlighted by a red box)? Select from mat (highlighted by a blue box) and table (highlighted by a green box).\n(A) mat\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331525_191685690656250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, sink (highlighted by a red box) or bathtub (highlighted by a blue box)?\n(A) sink\n(B) bathtub" }, { "from": "gpt", "value": "(B) bathtub" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48017894_80952555657416_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the bottle (highlighted by a red box)? bowl (highlighted by a blue box) or bottle (highlighted by a green box).\n(A) bowl\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018808_19403780713708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, chair (highlighted by a red box) or concrete (highlighted by a blue box)?\n(A) chair\n(B) concrete" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47431083_75386228860708_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to sheet (highlighted by a red box)? Select from bottle (highlighted by a blue box) and bottle (highlighted by a green box).\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261495_42764775148875_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to window (highlighted by a red box)? window (highlighted by a blue box) or window (highlighted by a green box).\n(A) window\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261228_13730710901333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444762_81575475807083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from picture frame (highlighted by a red box)? Select from picture frame (highlighted by a blue box) and nightstand (highlighted by a green box).\n(A) picture frame\n(B) nightstand" }, { "from": "gpt", "value": "(B) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334154_144349169851125_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from toiletry (highlighted by a red box)? Select from shelf (highlighted by a blue box) and toiletry (highlighted by a green box).\n(A) shelf\n(B) toiletry" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358225_9573342647375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, corded phone (highlighted by a red box) or book (highlighted by a blue box)?\n(A) corded phone\n(B) book" }, { "from": "gpt", "value": "(A) corded phone" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332109_683181703879041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, furniture (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) furniture\n(B) toilet paper" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261569_76341328852791_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from furniture (highlighted by a red box)? door (highlighted by a blue box) or dresser (highlighted by a green box)?\n(A) door\n(B) dresser" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446074_137222796364457_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from soap dispenser (highlighted by a red box)? Choose among these: toilet bowl (highlighted by a blue box) or bath towel (highlighted by a green box).\n(A) toilet bowl\n(B) bath towel" }, { "from": "gpt", "value": "(B) bath towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670201_53323406198875_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the lamp (highlighted by a red box)? Choose among these: radiator (highlighted by a blue box) or shutter (highlighted by a green box).\n(A) radiator\n(B) shutter" }, { "from": "gpt", "value": "(B) shutter" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430439_1090453923247_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to door (highlighted by a red box)? Select from door (highlighted by a blue box) and table (highlighted by a green box).\n(A) door\n(B) table" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333281_25532125290375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from table (highlighted by a red box)? paperback book (highlighted by a blue box) or tissue (highlighted by a green box)?\n(A) paperback book\n(B) tissue" }, { "from": "gpt", "value": "(B) tissue" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261455_35859447207416_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to pillow (highlighted by a red box)? Choose from wall clock (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) wall clock\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828441_91561041231375_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331496_153621413789125_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from mouthwash (highlighted by a red box)? Choose from mouthwash (highlighted by a blue box) and toiletry (highlighted by a green box).\n(A) mouthwash\n(B) toiletry" }, { "from": "gpt", "value": "(B) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899057_647037492644500_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from television (highlighted by a red box)? Choose from furniture (highlighted by a blue box) and furniture (highlighted by a green box).\n(A) furniture\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897728_114211531292250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, studio couch (highlighted by a red box) or concrete (highlighted by a blue box)?\n(A) studio couch\n(B) concrete" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333055_60403394595916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from door (highlighted by a red box)? electric outlet (highlighted by a blue box) or door (highlighted by a green box)?\n(A) electric outlet\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897547_473250090118583_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828442_91408135131625_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, window screen (highlighted by a red box) or door (highlighted by a blue box)?\n(A) window screen\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898261_696833938665833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, speaker (highlighted by a red box) or mouse (highlighted by a blue box)?\n(A) speaker\n(B) mouse" }, { "from": "gpt", "value": "(B) mouse" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649474_14627234503041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to shelf (highlighted by a red box), book (highlighted by a blue box) or table lamp (highlighted by a green box)?\n(A) book\n(B) table lamp" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649603_36061599688083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, chair (highlighted by a red box) or door (highlighted by a blue box)?\n(A) chair\n(B) door" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897780_129136924888500_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the lamp (highlighted by a red box)? pillow (highlighted by a blue box) or nightstand (highlighted by a green box).\n(A) pillow\n(B) nightstand" }, { "from": "gpt", "value": "(B) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649798_46220611299291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, appliance (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896494_31429935170125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of screen door (annotated by the red box) in relation to towel?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334720_534735622981750_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332026_202737094237208_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the armchair (highlighted by a red box)? pillow (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446607_88202782064625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from stool (highlighted by a red box)? Select from studio couch (highlighted by a blue box) and table lamp (highlighted by a green box).\n(A) studio couch\n(B) table lamp" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670346_66294492437416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, plant (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) plant\n(B) shelf" }, { "from": "gpt", "value": "(A) plant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899935_863099780688416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of lamp (annotated by the red box) and furniture in the image provided, where is lamp (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796579_16820176274623_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to door (highlighted by a red box)? Select from fireplace (highlighted by a blue box) and furniture (highlighted by a green box).\n(A) fireplace\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739690_1116138366250_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from picture frame (highlighted by a red box), picture frame (highlighted by a blue box) or window (highlighted by a green box)?\n(A) picture frame\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445137_5575141169916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from towel (highlighted by a red box)? Choose among these: radiator (highlighted by a blue box) or towel (highlighted by a green box).\n(A) radiator\n(B) towel" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663312_76710876811208_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to toiletry (highlighted by a red box)? mouthwash (highlighted by a blue box) or toothpaste (highlighted by a green box).\n(A) mouthwash\n(B) toothpaste" }, { "from": "gpt", "value": "(A) mouthwash" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358168_61156035884750_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from wall clock (highlighted by a red box)? Choose among these: door (highlighted by a blue box) or studio couch (highlighted by a green box).\n(A) door\n(B) studio couch" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445100_9166776412750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, curtain (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) curtain\n(B) curtain" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670291_62196211883041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to cabinetry (highlighted by a red box)? Choose from kitchen appliance (highlighted by a blue box) and gas stove (highlighted by a green box).\n(A) kitchen appliance\n(B) gas stove" }, { "from": "gpt", "value": "(A) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204481_24874670180958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from curtain (highlighted by a red box)? picture frame (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331388_198865299577583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from shelf (highlighted by a red box)? counter (highlighted by a blue box) or basket (highlighted by a green box)?\n(A) counter\n(B) basket" }, { "from": "gpt", "value": "(A) counter" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796212_1489457030583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from window sill (highlighted by a red box)? Choose from furniture (highlighted by a blue box) and sheet (highlighted by a green box).\n(A) furniture\n(B) sheet" }, { "from": "gpt", "value": "(B) sheet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739740_3762508425041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, picture frame (highlighted by a red box) or door (highlighted by a blue box)?\n(A) picture frame\n(B) door" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429816_744587893156375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from screen door (highlighted by a red box)? Select from shelf (highlighted by a blue box) and screen door (highlighted by a green box).\n(A) shelf\n(B) screen door" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332401_406053370758416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, appliance (highlighted by a red box) or gas stove (highlighted by a blue box)?\n(A) appliance\n(B) gas stove" }, { "from": "gpt", "value": "(B) gas stove" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649393_11171700664708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from picture frame (highlighted by a red box)? Choose among these: table lamp (highlighted by a blue box) or curtain (highlighted by a green box).\n(A) table lamp\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358234_9908772790875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, mirror (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) mirror\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649794_46070803942583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, exhaust hood (highlighted by a red box) or dot (highlighted by a blue box)?\n(A) exhaust hood\n(B) dot" }, { "from": "gpt", "value": "(B) dot" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896379_20411947344541_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhere is knob (annotated by the red box) located in relation to chest of drawers in the image?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018757_14886656134791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the cabinetry (highlighted by a red box)? houseplant (highlighted by a blue box) or table (highlighted by a green box).\n(A) houseplant\n(B) table" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896195_142294040345416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, curtain (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) curtain\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444923_220932441303916_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446445_354387137516916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, picture frame (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) picture frame\n(B) chair" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331627_20078045471875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, gas stove (highlighted by a red box) or kitchen appliance (highlighted by a blue box)?\n(A) gas stove\n(B) kitchen appliance" }, { "from": "gpt", "value": "(B) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261569_76311324601125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, radiator (highlighted by a red box) or cabinet (highlighted by a blue box)?\n(A) radiator\n(B) cabinet" }, { "from": "gpt", "value": "(B) cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649787_45937006882041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from chair (highlighted by a red box)? Choose from chair (highlighted by a blue box) and chair (highlighted by a green box).\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204350_15588028664375_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to door (highlighted by a red box)? Select from chair (highlighted by a blue box) and door (highlighted by a green box).\n(A) chair\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204319_15927962396958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from lamp (highlighted by a red box)? window (highlighted by a blue box) or door (highlighted by a green box)?\n(A) window\n(B) door" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895469_132746019447041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, picture frame (highlighted by a red box) or television (highlighted by a blue box)?\n(A) picture frame\n(B) television" }, { "from": "gpt", "value": "(B) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458245_78517507110125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to basket (highlighted by a red box)? Select from cabinetry (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) cabinetry\n(B) cabinetry" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261728_2856296802166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chair (highlighted by a red box) or table (highlighted by a blue box)?\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204730_23424627812708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from door (highlighted by a red box)? Choose among these: lamp (highlighted by a blue box) or studio couch (highlighted by a green box).\n(A) lamp\n(B) studio couch" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670244_63593311095500_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the cabinetry (highlighted by a red box)? Choose among these: shoe (highlighted by a blue box) or shoe (highlighted by a green box).\n(A) shoe\n(B) shoe" }, { "from": "gpt", "value": "(A) shoe" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895635_471899692326291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, bookcase (highlighted by a red box) or book (highlighted by a blue box)?\n(A) bookcase\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331934_163619797674416_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from plastic bag (highlighted by a red box)? Select from table top (highlighted by a blue box) and food (highlighted by a green box).\n(A) table top\n(B) food" }, { "from": "gpt", "value": "(A) table top" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895233_73797190740375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, countertop (highlighted by a red box) or drawer (highlighted by a blue box)?\n(A) countertop\n(B) drawer" }, { "from": "gpt", "value": "(A) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261666_2557254448666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is air conditioning (annotated by the red box) located relative to air conditioning?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669851_12535862093250_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the chair (highlighted by a red box)? Choose among these: screen door (highlighted by a blue box) or doormat (highlighted by a green box).\n(A) screen door\n(B) doormat" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47431078_74748101792166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, chair (highlighted by a red box) or table (highlighted by a blue box)?\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429799_737737033082208_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the stove (highlighted by a red box)? Choose among these: bottle (highlighted by a blue box) or tap (highlighted by a green box).\n(A) bottle\n(B) tap" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261096_1362441141208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, bowl (highlighted by a red box) or apple (highlighted by a blue box)?\n(A) bowl\n(B) apple" }, { "from": "gpt", "value": "(A) bowl" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828250_81661492658291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of curtain (annotated by the red box) in relation to door? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334066_87437210692583_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from toilet paper (highlighted by a red box), shelf (highlighted by a blue box) or toilet (highlighted by a green box)?\n(A) shelf\n(B) toilet" }, { "from": "gpt", "value": "(B) toilet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115205_95177834677541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, table lamp (highlighted by a red box) or window (highlighted by a blue box)?\n(A) table lamp\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445627_58202070573083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is curtain (annotated by the red box) located relative to window? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739276_42739463476875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, window (highlighted by a red box) or light fixture (highlighted by a blue box)?\n(A) window\n(B) light fixture" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898256_696572929295291_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445695_57380282701791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, footwear (highlighted by a red box) or pavement (highlighted by a blue box)?\n(A) footwear\n(B) pavement" }, { "from": "gpt", "value": "(A) footwear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430294_187711258780833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the book (highlighted by a red box)? table (highlighted by a blue box) or book (highlighted by a green box).\n(A) table\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333840_54045572884833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, picture frame (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) picture frame\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261108_1101049442083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from chair (highlighted by a red box)? Select from table (highlighted by a blue box) and chair (highlighted by a green box).\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261251_12643498098291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chair (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) chair\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333031_59058923584208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, table (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) table\n(B) studio couch" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670208_54173667229000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, footwear (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) footwear\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649464_13863136954166_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to book (highlighted by a red box)? Choose from table (highlighted by a blue box) and book (highlighted by a green box).\n(A) table\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897439_105068833262916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, curtain (highlighted by a red box) or balustrade (highlighted by a blue box)?\n(A) curtain\n(B) balustrade" }, { "from": "gpt", "value": "(B) balustrade" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458511_113804650069958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to door (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and light switch (highlighted by a green box).\n(A) picture frame\n(B) light switch" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670158_40723930492750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, chair (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) chair\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332072_249965081531125_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from door (highlighted by a red box)? Select from fridge (highlighted by a blue box) and screen door (highlighted by a green box).\n(A) fridge\n(B) screen door" }, { "from": "gpt", "value": "(A) fridge" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204820_28643229349416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of shoe (annotated by the red box) and furniture in the image provided, where is shoe (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429739_20094567613625_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from person (highlighted by a red box)? book (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) book\n(B) picture frame" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331053_482530325550791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, screen door (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) screen door\n(B) appliance" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334896_1084495938496958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to beach towel (highlighted by a red box)? Choose from footwear (highlighted by a blue box) and sink (highlighted by a green box).\n(A) footwear\n(B) sink" }, { "from": "gpt", "value": "(A) footwear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896117_146013617444375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from picture frame (highlighted by a red box)? shelf (highlighted by a blue box) or shelf (highlighted by a green box)?\n(A) shelf\n(B) shelf" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828328_77668571352250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, furniture (highlighted by a red box) or clothing (highlighted by a blue box)?\n(A) furniture\n(B) clothing" }, { "from": "gpt", "value": "(B) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445612_56526304414708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to picture frame (highlighted by a red box), lamp (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) lamp\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898349_509473016060875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, toilet paper (highlighted by a red box) or sink (highlighted by a blue box)?\n(A) toilet paper\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358378_19058951022250_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to table (highlighted by a red box)? Select from television (highlighted by a blue box) and table (highlighted by a green box).\n(A) television\n(B) table" }, { "from": "gpt", "value": "(A) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897490_471228816395750_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, chair (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) chair\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332505_343938879779541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to armchair (highlighted by a red box)? Choose from chair (highlighted by a blue box) and chair (highlighted by a green box).\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334057_86198894759291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, houseplant (highlighted by a red box) or window blind (highlighted by a blue box)?\n(A) houseplant\n(B) window blind" }, { "from": "gpt", "value": "(B) window blind" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018239_469391649284000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of bean bag chair (annotated by the red box) in reference to curtain?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670224_53949160667250_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, cabinetry (highlighted by a red box) or clothing (highlighted by a blue box)?\n(A) cabinetry\n(B) clothing" }, { "from": "gpt", "value": "(B) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261201_11545979295000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, table (highlighted by a red box) or counter top (highlighted by a blue box)?\n(A) table\n(B) counter top" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430212_688639247515791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, picture frame (highlighted by a red box) or ceramic tile (highlighted by a blue box)?\n(A) picture frame\n(B) ceramic tile" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897804_131504407806915_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from kitchen appliance (highlighted by a red box)? Choose among these: cabinetry (highlighted by a blue box) or kitchen appliance (highlighted by a green box).\n(A) cabinetry\n(B) kitchen appliance" }, { "from": "gpt", "value": "(B) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333840_54097768366750_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the furniture (highlighted by a red box)? Choose among these: flannel (highlighted by a blue box) or blanket (highlighted by a green box).\n(A) flannel\n(B) blanket" }, { "from": "gpt", "value": "(A) flannel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739414_191332471861750_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhere is chest of drawers (annotated by the red box) located in relation to concrete in the image?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334912_1089964477558791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from furniture (highlighted by a red box)? Select from table (highlighted by a blue box) and bottle (highlighted by a green box).\n(A) table\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895793_680518592913958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, houseplant (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) houseplant\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430246_182549578422416_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to table (highlighted by a red box), bookcase (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) bookcase\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115574_2481213740125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, electric outlet (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) electric outlet\n(B) basket" }, { "from": "gpt", "value": "(B) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649590_35396731818791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, window (highlighted by a red box) or clock (highlighted by a blue box)?\n(A) window\n(B) clock" }, { "from": "gpt", "value": "(B) clock" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358386_19240745523125_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to pillow (highlighted by a red box)? studio couch (highlighted by a blue box) or table (highlighted by a green box).\n(A) studio couch\n(B) table" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331277_13045948149291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, frying pan (highlighted by a red box) or frying pan (highlighted by a blue box)?\n(A) frying pan\n(B) frying pan" }, { "from": "gpt", "value": "(B) frying pan" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358345_15200817066041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, cat bed (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) cat bed\n(B) studio couch" }, { "from": "gpt", "value": "(A) cat bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204305_15274267775250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, window sill (highlighted by a red box) or window frame (highlighted by a blue box)?\n(A) window sill\n(B) window frame" }, { "from": "gpt", "value": "(B) window frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896063_132110992897750_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from picture frame (highlighted by a red box)? Choose from writing (highlighted by a blue box) and glass door (highlighted by a green box).\n(A) writing\n(B) glass door" }, { "from": "gpt", "value": "(B) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898720_582951674920041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from lamp (highlighted by a red box)? Choose from light switch (highlighted by a blue box) and screen door (highlighted by a green box).\n(A) light switch\n(B) screen door" }, { "from": "gpt", "value": "(A) light switch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332204_264156577418832_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from plant (highlighted by a red box)? Choose among these: floral arrangement (highlighted by a blue box) or curtain (highlighted by a green box).\n(A) floral arrangement\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670201_53325405370750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, coffee table (highlighted by a red box) or desk (highlighted by a blue box)?\n(A) coffee table\n(B) desk" }, { "from": "gpt", "value": "(A) coffee table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331938_164821925923583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from window (highlighted by a red box), swivel chair (highlighted by a blue box) or radiator (highlighted by a green box)?\n(A) swivel chair\n(B) radiator" }, { "from": "gpt", "value": "(A) swivel chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670183_43189055293166_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to toilet paper (highlighted by a red box)? bag (highlighted by a blue box) or bath (highlighted by a green box).\n(A) bag\n(B) bath" }, { "from": "gpt", "value": "(B) bath" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444768_81532776630916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, furniture (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) furniture\n(B) furniture" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458757_141680449093833_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the bed (highlighted by a red box)? Choose among these: footwear (highlighted by a blue box) or footwear (highlighted by a green box).\n(A) footwear\n(B) footwear" }, { "from": "gpt", "value": "(B) footwear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261248_15156799501625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, bookcase (highlighted by a red box) or book (highlighted by a blue box)?\n(A) bookcase\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331202_279430979742873_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, chair (highlighted by a red box) or bowl (highlighted by a blue box)?\n(A) chair\n(B) bowl" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261206_11688470307208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, pillow (highlighted by a red box) or glass bowl (highlighted by a blue box)?\n(A) pillow\n(B) glass bowl" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445462_151094331922000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from window (highlighted by a red box), screen door (highlighted by a blue box) or postcard (highlighted by a green box)?\n(A) screen door\n(B) postcard" }, { "from": "gpt", "value": "(B) postcard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332109_683177705487833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, furniture (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) furniture\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899630_229933567455375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is book (annotated by the red box) located relative to desk?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430293_187360351016666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to shelf (highlighted by a red box)? Select from curtain (highlighted by a blue box) and table lamp (highlighted by a green box).\n(A) curtain\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334040_278935914437500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, wall clock (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) wall clock\n(B) lamp" }, { "from": "gpt", "value": "(A) wall clock" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334883_622617683347958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to curtain (highlighted by a red box), banana (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) banana\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334147_142761223870958_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334890_623251957839208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, bathroom cabinet (highlighted by a red box) or soap (highlighted by a blue box)?\n(A) bathroom cabinet\n(B) soap" }, { "from": "gpt", "value": "(B) soap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261357_25840227092583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, countertop (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) countertop\n(B) bottle" }, { "from": "gpt", "value": "(A) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332295_385457398459791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, lamp (highlighted by a red box) or yoga mat (highlighted by a blue box)?\n(A) lamp\n(B) yoga mat" }, { "from": "gpt", "value": "(B) yoga mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445487_153417400046625_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, radiator (highlighted by a red box) or bed (highlighted by a blue box)?\n(A) radiator\n(B) bed" }, { "from": "gpt", "value": "(B) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897713_111842398796333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, radiator (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) radiator\n(B) furniture" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899936_863438273852833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, appliance (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739417_191285457124250_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to door (highlighted by a red box), screen door (highlighted by a blue box) or lamp (highlighted by a green box)?\n(A) screen door\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430983_101593024766666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from coffee cup (highlighted by a red box)? cabinetry (highlighted by a blue box) or mug (highlighted by a green box)?\n(A) cabinetry\n(B) mug" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649590_35410726020333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from gas stove (highlighted by a red box)? Choose among these: home appliance (highlighted by a blue box) or kitchen appliance (highlighted by a green box).\n(A) home appliance\n(B) kitchen appliance" }, { "from": "gpt", "value": "(A) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430928_92929573466291_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from light fixture (highlighted by a red box), counter top (highlighted by a blue box) or door (highlighted by a green box)?\n(A) counter top\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333274_24098609426875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261571_76522220589583_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to bed (highlighted by a red box)? door (highlighted by a blue box) or power outlet (highlighted by a green box).\n(A) door\n(B) power outlet" }, { "from": "gpt", "value": "(B) power outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333293_26536634849166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to toilet paper (highlighted by a red box), toilet (highlighted by a blue box) or toilet paper (highlighted by a green box)?\n(A) toilet\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333194_47271938730125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, cabinetry (highlighted by a red box) or kettle (highlighted by a blue box)?\n(A) cabinetry\n(B) kettle" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333583_207380136553166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of curtain (annotated by the red box) in relation to animal? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334213_105825497409041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from turquoise (highlighted by a red box)? toothbrush (highlighted by a blue box) or sink (highlighted by a green box)?\n(A) toothbrush\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896494_31439947695291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, towel (highlighted by a red box) or faucet (highlighted by a blue box)?\n(A) towel\n(B) faucet" }, { "from": "gpt", "value": "(A) towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332295_385433391548625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chair (highlighted by a red box) or food (highlighted by a blue box)?\n(A) chair\n(B) food" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333281_25646528457333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to dumbbell (highlighted by a red box), chair (highlighted by a blue box) or beach towel (highlighted by a green box)?\n(A) chair\n(B) beach towel" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898983_823801400838000_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115624_3701100244416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, cupboard (highlighted by a red box) or drawer (highlighted by a blue box)?\n(A) cupboard\n(B) drawer" }, { "from": "gpt", "value": "(B) drawer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333319_28521139655416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to crate (highlighted by a red box)? Choose from counter top (highlighted by a blue box) and radiator (highlighted by a green box).\n(A) counter top\n(B) radiator" }, { "from": "gpt", "value": "(A) counter top" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204852_1553536834666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, bathroom cabinet (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) bathroom cabinet\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331128_174148535469875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, book (highlighted by a red box) or bookcase (highlighted by a blue box)?\n(A) book\n(B) bookcase" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896010_137088662038457_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, table (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) table\n(B) studio couch" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429854_12605549971291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, bathtub (highlighted by a red box) or tap (highlighted by a blue box)?\n(A) bathtub\n(B) tap" }, { "from": "gpt", "value": "(A) bathtub" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261688_304443184000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, electric outlet (highlighted by a red box) or window screen (highlighted by a blue box)?\n(A) electric outlet\n(B) window screen" }, { "from": "gpt", "value": "(B) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649382_10552255132041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, dresser (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) dresser\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663009_32454515324083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, window (highlighted by a red box) or window (highlighted by a blue box)?\n(A) window\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204726_23613915996583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to bay window (highlighted by a red box)? Choose from curtain (highlighted by a blue box) and lamp (highlighted by a green box).\n(A) curtain\n(B) lamp" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895298_91057137169750_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the chair (highlighted by a red box)? tableware (highlighted by a blue box) or radiator (highlighted by a green box).\n(A) tableware\n(B) radiator" }, { "from": "gpt", "value": "(A) tableware" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828442_91398139094250_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to studio couch (highlighted by a red box)? coffee table (highlighted by a blue box) or chair (highlighted by a green box).\n(A) coffee table\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331216_281057054173750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is chair (annotated by the red box) located relative to hat? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896042_130063240070250_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the light fixture (highlighted by a red box)? Choose among these: shower (highlighted by a blue box) or screen door (highlighted by a green box).\n(A) shower\n(B) screen door" }, { "from": "gpt", "value": "(A) shower" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47330995_176925285232875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, kitchen appliance (highlighted by a red box) or kitchen appliance (highlighted by a blue box)?\n(A) kitchen appliance\n(B) kitchen appliance" }, { "from": "gpt", "value": "(B) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897948_351377903021791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of curtain (annotated by the red box) in reference to curtain?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445079_5557317710000_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from window (highlighted by a red box)? curtain (highlighted by a blue box) or bed (highlighted by a green box)?\n(A) curtain\n(B) bed" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115136_85982738219791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from bathtub (highlighted by a red box)? cleaning product (highlighted by a blue box) or curtain (highlighted by a green box)?\n(A) cleaning product\n(B) curtain" }, { "from": "gpt", "value": "(A) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334039_278817112774791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, appliance (highlighted by a red box) or window (highlighted by a blue box)?\n(A) appliance\n(B) window" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333159_41496622029166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, door (highlighted by a red box) or door (highlighted by a blue box)?\n(A) door\n(B) door" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649742_49606992693958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from book (highlighted by a red box)? swivel chair (highlighted by a blue box) or document (highlighted by a green box)?\n(A) swivel chair\n(B) document" }, { "from": "gpt", "value": "(B) document" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895482_134719421927500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of shelf (annotated by the red box) in relation to book?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897722_114374630092208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, paperback book (highlighted by a red box) or paperback book (highlighted by a blue box)?\n(A) paperback book\n(B) paperback book" }, { "from": "gpt", "value": "(B) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204828_28547617157708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, lamp (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) lamp\n(B) table lamp" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896089_143948091391333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, exhaust hood (highlighted by a red box) or gas stove (highlighted by a blue box)?\n(A) exhaust hood\n(B) gas stove" }, { "from": "gpt", "value": "(B) gas stove" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458286_76234033102541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, curtain (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) curtain\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261544_75089855397458_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is magazine (annotated by the red box) located relative to toilet paper? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662950_24224415035083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, door (highlighted by a red box) or chest of drawers (highlighted by a blue box)?\n(A) door\n(B) chest of drawers" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333164_42716301537625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, toilet (highlighted by a red box) or blanket (highlighted by a blue box)?\n(A) toilet\n(B) blanket" }, { "from": "gpt", "value": "(A) toilet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899285_885263561922083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, home appliance (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) home appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649403_9544368081833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, furniture (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) furniture\n(B) basket" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204453_23113582016083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the chair (highlighted by a red box)? table (highlighted by a blue box) or studio couch (highlighted by a green box).\n(A) table\n(B) studio couch" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458452_118134140201250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, cabinet (highlighted by a red box) or cabinet (highlighted by a blue box)?\n(A) cabinet\n(B) cabinet" }, { "from": "gpt", "value": "(A) cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018276_794875077823875_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, door (highlighted by a red box) or door (highlighted by a blue box)?\n(A) door\n(B) door" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332026_202753104389000_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, laptop (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) laptop\n(B) radiator" }, { "from": "gpt", "value": "(A) laptop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669878_10474340641416_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from vase (highlighted by a red box)? cabinetry (highlighted by a blue box) or door (highlighted by a green box)?\n(A) cabinetry\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334052_85626333753541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, countertop (highlighted by a red box) or kitchen appliance (highlighted by a blue box)?\n(A) countertop\n(B) kitchen appliance" }, { "from": "gpt", "value": "(A) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796446_601717445416_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from pillow (highlighted by a red box)? bed (highlighted by a blue box) or glass door (highlighted by a green box)?\n(A) bed\n(B) glass door" }, { "from": "gpt", "value": "(B) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899236_880525934034708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from pillow (highlighted by a red box)? Select from studio couch (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649756_51899641618041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, sink (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) sink\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828340_78893436563583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the table lamp (highlighted by a red box)? pillow (highlighted by a blue box) or swivel chair (highlighted by a green box).\n(A) pillow\n(B) swivel chair" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430236_181857076665958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, mouthwash (highlighted by a red box) or mouthwash (highlighted by a blue box)?\n(A) mouthwash\n(B) mouthwash" }, { "from": "gpt", "value": "(A) mouthwash" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204786_27295567507458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899030_643088776811250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, plant (highlighted by a red box) or book (highlighted by a blue box)?\n(A) plant\n(B) book" }, { "from": "gpt", "value": "(A) plant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331346_192272518309958_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from bottle (highlighted by a red box)? Choose from cabinetry (highlighted by a blue box) and wine bottle (highlighted by a green box).\n(A) cabinetry\n(B) wine bottle" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358230_10024158304375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, window (highlighted by a red box) or package (highlighted by a blue box)?\n(A) window\n(B) package" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018585_5503200300583_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the window screen (highlighted by a red box)? Choose among these: curtain (highlighted by a blue box) or curtain (highlighted by a green box).\n(A) curtain\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430931_92869381292458_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from person (highlighted by a red box)? Choose among these: poster (highlighted by a blue box) or postcard (highlighted by a green box).\n(A) poster\n(B) postcard" }, { "from": "gpt", "value": "(A) poster" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115265_115193274740041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from pillow (highlighted by a red box), electric outlet (highlighted by a blue box) or nightstand (highlighted by a green box)?\n(A) electric outlet\n(B) nightstand" }, { "from": "gpt", "value": "(A) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334608_385009959263625_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from curtain (highlighted by a red box), guitar (highlighted by a blue box) or window screen (highlighted by a green box)?\n(A) guitar\n(B) window screen" }, { "from": "gpt", "value": "(A) guitar" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204830_535945110375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, plant (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) plant\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204747_25248686761375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, studio couch (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333031_59010826470416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of chest of drawers (annotated by the red box) in relation to picture frame?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358418_41199916941708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from toilet paper (highlighted by a red box), toilet paper (highlighted by a blue box) or toilet paper (highlighted by a green box)?\n(A) toilet paper\n(B) toilet paper" }, { "from": "gpt", "value": "(A) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204335_15038297908791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to lamp (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261565_76406435230458_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to radiator (highlighted by a red box)? Choose from nightstand (highlighted by a blue box) and window sill (highlighted by a green box).\n(A) nightstand\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899650_233812272076750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, table (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) table\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331476_151032232234833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, table (highlighted by a red box) or window screen (highlighted by a blue box)?\n(A) table\n(B) window screen" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334967_669357388139416_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430814_65783687543416_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the refrigerator (highlighted by a red box)? Choose among these: appliance (highlighted by a blue box) or screen door (highlighted by a green box).\n(A) appliance\n(B) screen door" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333275_24796507008916_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to pillow (highlighted by a red box)? Choose from laptop (highlighted by a blue box) and balloon (highlighted by a green box).\n(A) laptop\n(B) balloon" }, { "from": "gpt", "value": "(A) laptop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018089_104008326211500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, curtain (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) curtain\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899513_197677244694541_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898358_511578570357291_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from appliance (highlighted by a red box)? Select from appliance (highlighted by a blue box) and appliance (highlighted by a green box).\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115227_95900745356458_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from bottle (highlighted by a red box)? Select from lamp (highlighted by a blue box) and bottle (highlighted by a green box).\n(A) lamp\n(B) bottle" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358173_62431039741250_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from floral arrangement (highlighted by a red box)? glass door (highlighted by a blue box) or screen door (highlighted by a green box)?\n(A) glass door\n(B) screen door" }, { "from": "gpt", "value": "(A) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895796_680729407518916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, chest of drawers (highlighted by a red box) or television (highlighted by a blue box)?\n(A) chest of drawers\n(B) television" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796562_15956474290708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the chair (highlighted by a red box)? Choose among these: window (highlighted by a blue box) or radiator (highlighted by a green box).\n(A) window\n(B) radiator" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333973_47890982108666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of table (annotated by the red box) and log in the image provided, where is table (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204517_757158226125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, appliance (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446485_355826355776416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, pad (highlighted by a red box) or pad (highlighted by a blue box)?\n(A) pad\n(B) pad" }, { "from": "gpt", "value": "(A) pad" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895911_111458840832875_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444789_50497495600916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is shower curtain (annotated by the red box) located relative to curtain?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334202_103311005766208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, table (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) table\n(B) houseplant" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895233_73857182921833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, tableware (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) tableware\n(B) cabinetry" }, { "from": "gpt", "value": "(A) tableware" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331273_12865155314666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from mixing bowl (highlighted by a red box)? Select from cabinet (highlighted by a blue box) and curtain (highlighted by a green box).\n(A) cabinet\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332204_264182883435458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, warning sign (highlighted by a red box) or postcard (highlighted by a blue box)?\n(A) warning sign\n(B) postcard" }, { "from": "gpt", "value": "(A) warning sign" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333018_130143211057333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, picture frame (highlighted by a red box) or clock (highlighted by a blue box)?\n(A) picture frame\n(B) clock" }, { "from": "gpt", "value": "(B) clock" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358693_3138721151166_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, considering the relative positions of fireplace (annotated by the red box) and window sill in the image provided, where is fireplace (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445639_58352774815666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331625_20150832607416_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from appliance (highlighted by a red box)? Choose from shelf (highlighted by a blue box) and curtain (highlighted by a green box).\n(A) shelf\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358121_62407081543583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the television (highlighted by a red box)? picture frame (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445834_68165680397541_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670288_62112311723875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, houseplant (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) houseplant\n(B) screen door" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895199_39510112575958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, swivel chair (highlighted by a red box) or paperback book (highlighted by a blue box)?\n(A) swivel chair\n(B) paperback book" }, { "from": "gpt", "value": "(B) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828150_73397403717625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, step stool (highlighted by a red box) or table (highlighted by a blue box)?\n(A) step stool\n(B) table" }, { "from": "gpt", "value": "(A) step stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670293_62059915772416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, window (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) window\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018550_830278734415375_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898899_816896731715250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, floral arrangement (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) floral arrangement\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446574_86432065420500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, appliance (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018090_104085728236833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, toiletry (highlighted by a red box) or mouthwash (highlighted by a blue box)?\n(A) toiletry\n(B) mouthwash" }, { "from": "gpt", "value": "(B) mouthwash" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670250_63471111707458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, appliance (highlighted by a red box) or window screen (highlighted by a blue box)?\n(A) appliance\n(B) window screen" }, { "from": "gpt", "value": "(B) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662875_14445375812708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, chest of drawers (highlighted by a red box) or mattress (highlighted by a blue box)?\n(A) chest of drawers\n(B) mattress" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204920_3732895578458_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, nightstand (highlighted by a red box) or bed (highlighted by a blue box)?\n(A) nightstand\n(B) bed" }, { "from": "gpt", "value": "(A) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828391_94918696705083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of toilet (annotated by the red box) and bath in the image provided, where is toilet (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018808_19377774583541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chair (highlighted by a red box) or door (highlighted by a blue box)?\n(A) chair\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895279_79301908912541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to cabinetry (highlighted by a red box)? stairwell (highlighted by a blue box) or door (highlighted by a green box).\n(A) stairwell\n(B) door" }, { "from": "gpt", "value": "(A) stairwell" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899034_643200912445916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333803_51412554083541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to curtain (highlighted by a red box)? swivel chair (highlighted by a blue box) or glass door (highlighted by a green box).\n(A) swivel chair\n(B) glass door" }, { "from": "gpt", "value": "(B) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430901_80993365287375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, door (highlighted by a red box) or cardboard box (highlighted by a blue box)?\n(A) door\n(B) cardboard box" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332183_262823415761916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, infant bed (highlighted by a red box) or chest of drawers (highlighted by a blue box)?\n(A) infant bed\n(B) chest of drawers" }, { "from": "gpt", "value": "(A) infant bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458690_135442795085875_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from television (highlighted by a red box)? footrest (highlighted by a blue box) or desk (highlighted by a green box)?\n(A) footrest\n(B) desk" }, { "from": "gpt", "value": "(A) footrest" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018612_633094720796041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, lamp (highlighted by a red box) or window (highlighted by a blue box)?\n(A) lamp\n(B) window" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895482_134659229815875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, animal (highlighted by a red box) or animal (highlighted by a blue box)?\n(A) animal\n(B) animal" }, { "from": "gpt", "value": "(A) animal" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332314_387842145462125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of power plugs and sockets (annotated by the red box) in relation to laundry?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332177_262460112896625_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from shelf (highlighted by a red box)? Choose among these: shelf (highlighted by a blue box) or luggage (highlighted by a green box).\n(A) shelf\n(B) luggage" }, { "from": "gpt", "value": "(B) luggage" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898917_816683235471958_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649714_47794659000125_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the plant (highlighted by a red box)? Choose among these: picture frame (highlighted by a blue box) or appliance (highlighted by a green box).\n(A) picture frame\n(B) appliance" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649403_9548366501333_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, laundry basket (highlighted by a red box) or luggage (highlighted by a blue box)?\n(A) laundry basket\n(B) luggage" }, { "from": "gpt", "value": "(B) luggage" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898560_183732598018333_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, furniture (highlighted by a red box) or concrete (highlighted by a blue box)?\n(A) furniture\n(B) concrete" }, { "from": "gpt", "value": "(B) concrete" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115283_118324732020916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, coffee machine (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) coffee machine\n(B) bottle" }, { "from": "gpt", "value": "(A) coffee machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669936_14829895681250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, shoe (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) shoe\n(B) mat" }, { "from": "gpt", "value": "(A) shoe" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670358_67306276537291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from computer screen (highlighted by a red box)? Choose from window sill (highlighted by a blue box) and window (highlighted by a green box).\n(A) window sill\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898256_696542341842083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the book (highlighted by a red box)? computer monitor (highlighted by a blue box) or man (highlighted by a green box).\n(A) computer monitor\n(B) man" }, { "from": "gpt", "value": "(A) computer monitor" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018098_367381311301250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, screen door (highlighted by a red box) or knob (highlighted by a blue box)?\n(A) screen door\n(B) knob" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446444_82548617599583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of screen door (annotated by the red box) in reference to fruit?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358661_1200992800125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, door (highlighted by a red box) or door (highlighted by a blue box)?\n(A) door\n(B) door" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896162_139845581604125_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to cleaning product (highlighted by a red box)? Select from mirror (highlighted by a blue box) and cleaning product (highlighted by a green box).\n(A) mirror\n(B) cleaning product" }, { "from": "gpt", "value": "(B) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430519_298843623038791_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333056_60167090488625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to houseplant (highlighted by a red box)? Select from book (highlighted by a blue box) and curtain (highlighted by a green box).\n(A) book\n(B) curtain" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358230_10108556618375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the electric outlet (highlighted by a red box)? bed (highlighted by a blue box) or electric outlet (highlighted by a green box).\n(A) bed\n(B) electric outlet" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333265_21714115153416_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to appliance (highlighted by a red box), postcard (highlighted by a blue box) or notepad (highlighted by a green box)?\n(A) postcard\n(B) notepad" }, { "from": "gpt", "value": "(A) postcard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896249_7545493503041_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to hospital bed (highlighted by a red box)? Select from bed (highlighted by a blue box) and window (highlighted by a green box).\n(A) bed\n(B) window" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115222_95794739391416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, table (highlighted by a red box) or candle holder (highlighted by a blue box)?\n(A) table\n(B) candle holder" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018833_649133967765916_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from window (highlighted by a red box)? Select from curtain (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) curtain\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429799_737727037112333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of counter (annotated by the red box) in relation to cabinetry? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358281_9115522620125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of chest of drawers (annotated by the red box) in reference to waste container? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899600_202652425956083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhere is stool (annotated by the red box) located in relation to glass vase in the image?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334079_88623186576416_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from power outlet (highlighted by a red box)? Choose from blanket (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) blanket\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896429_19272540139416_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from chest of drawers (highlighted by a red box)? Choose among these: picture frame (highlighted by a blue box) or electric outlet (highlighted by a green box).\n(A) picture frame\n(B) electric outlet" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895623_470809441581833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the bath (highlighted by a red box)? waste container (highlighted by a blue box) or bath mat (highlighted by a green box).\n(A) waste container\n(B) bath mat" }, { "from": "gpt", "value": "(A) waste container" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899603_202414141262250_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from stool (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and table lamp (highlighted by a green box).\n(A) picture frame\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896038_130016941722500_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the toiletry (highlighted by a red box)? tap (highlighted by a blue box) or screen door (highlighted by a green box).\n(A) tap\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333117_114376650124708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to window (highlighted by a red box)? Select from curtain (highlighted by a blue box) and handbag (highlighted by a green box).\n(A) curtain\n(B) handbag" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447275_408607603754041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, table (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649692_36051757693500_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from table lamp (highlighted by a red box)? Choose from bed (highlighted by a blue box) and nightstand (highlighted by a green box).\n(A) bed\n(B) nightstand" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331762_7368246939375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, chair (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332207_264631967925707_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, pillow (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) pillow\n(B) toy" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358386_19308751928291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, lamp (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) lamp\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261313_22299847130708_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to studio couch (highlighted by a red box)? Select from studio couch (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429804_737545526885333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is curtain (annotated by the red box) located relative to radiator?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018455_527110058467958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to soap dispenser (highlighted by a red box)? mouthwash (highlighted by a blue box) or sink (highlighted by a green box).\n(A) mouthwash\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445689_61669873525958_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204724_23528518102750_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, entertainment center (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) entertainment center\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430141_33567172788208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, wide (highlighted by a red box) or desk (highlighted by a blue box)?\n(A) wide\n(B) desk" }, { "from": "gpt", "value": "(A) wide" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649615_36968262899958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from bath towel (highlighted by a red box), towel bar (highlighted by a blue box) or bathtub (highlighted by a green box)?\n(A) towel bar\n(B) bathtub" }, { "from": "gpt", "value": "(B) bathtub" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331627_20082043850708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, cabinetry (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) cabinetry\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334227_107020312999125_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from cardboard box (highlighted by a red box)? window screen (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) window screen\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334867_620693915615291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331294_14727247057916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, clothing (highlighted by a red box) or clothing (highlighted by a blue box)?\n(A) clothing\n(B) clothing" }, { "from": "gpt", "value": "(A) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331542_6914907283541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to pillow (highlighted by a red box), blanket (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) blanket\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898695_581023780781083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from blanket (highlighted by a red box)? Select from stool (highlighted by a blue box) and table lamp (highlighted by a green box).\n(A) stool\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895448_129473082134541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, closet (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) closet\n(B) toiletry" }, { "from": "gpt", "value": "(A) closet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662886_16461693118000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, armchair (highlighted by a red box) or window (highlighted by a blue box)?\n(A) armchair\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331343_192407413576166_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the appliance (highlighted by a red box)? appliance (highlighted by a blue box) or curtain (highlighted by a green box).\n(A) appliance\n(B) curtain" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018757_14910663129625_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from window (highlighted by a red box)? Choose from window (highlighted by a blue box) and houseplant (highlighted by a green box).\n(A) window\n(B) houseplant" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445770_65537435445166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from chair (highlighted by a red box)? Choose from bed (highlighted by a blue box) and table (highlighted by a green box).\n(A) bed\n(B) table" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115126_84584938668458_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, mirror (highlighted by a red box) or plain (highlighted by a blue box)?\n(A) mirror\n(B) plain" }, { "from": "gpt", "value": "(B) plain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446579_205787441086291_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from table (highlighted by a red box)? pillow (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649478_15081138167750_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the studio couch (highlighted by a red box)? Choose among these: pillow (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) pillow\n(B) picture frame" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445716_63693895436791_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from bathtub (highlighted by a red box), soap dispenser (highlighted by a blue box) or sink (highlighted by a green box)?\n(A) soap dispenser\n(B) sink" }, { "from": "gpt", "value": "(B) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333244_33530207570125_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to table (highlighted by a red box)? furniture (highlighted by a blue box) or table (highlighted by a green box).\n(A) furniture\n(B) table" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669927_14210971651625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the coffee table (highlighted by a red box)? table (highlighted by a blue box) or studio couch (highlighted by a green box).\n(A) table\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896216_4211642875415_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of window (annotated by the red box) in reference to wire?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(A) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331707_11125914286708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, cabinetry (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) cabinetry\n(B) bottle" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897409_103022481191791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to glass door (highlighted by a red box)? Choose from cabinetry (highlighted by a blue box) and radiator (highlighted by a green box).\n(A) cabinetry\n(B) radiator" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899950_864933623958000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, chest of drawers (highlighted by a red box) or doormat (highlighted by a blue box)?\n(A) chest of drawers\n(B) doormat" }, { "from": "gpt", "value": "(A) chest of drawers" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899643_231929989872166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to bed (highlighted by a red box)? Choose from material (highlighted by a blue box) and nightstand (highlighted by a green box).\n(A) material\n(B) nightstand" }, { "from": "gpt", "value": "(A) material" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332152_259935933044625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from book (highlighted by a red box)? paperback book (highlighted by a blue box) or shelf (highlighted by a green box)?\n(A) paperback book\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018284_799362113042125_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to pillow (highlighted by a red box)? baby carriage (highlighted by a blue box) or screen door (highlighted by a green box).\n(A) baby carriage\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332106_683007807156250_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from counter top (highlighted by a red box)? Select from mat (highlighted by a blue box) and dresser (highlighted by a green box).\n(A) mat\n(B) dresser" }, { "from": "gpt", "value": "(B) dresser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896096_144154789101541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to appliance (highlighted by a red box), pillow (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670040_32864822748833_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to toy (highlighted by a red box), shelf (highlighted by a blue box) or drawer (highlighted by a green box)?\n(A) shelf\n(B) drawer" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115624_3651086696958_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, box (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) box\n(B) bottle" }, { "from": "gpt", "value": "(A) box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334039_278769015669083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, shelf (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) shelf\n(B) lamp" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204341_14960195460791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, houseplant (highlighted by a red box) or window screen (highlighted by a blue box)?\n(A) houseplant\n(B) window screen" }, { "from": "gpt", "value": "(B) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47431107_348278576176000_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the toilet paper (highlighted by a red box)? Choose among these: toilet paper (highlighted by a blue box) or fancy dress (highlighted by a green box).\n(A) toilet paper\n(B) fancy dress" }, { "from": "gpt", "value": "(A) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332207_264545769612958_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, window screen (highlighted by a red box) or window screen (highlighted by a blue box)?\n(A) window screen\n(B) window screen" }, { "from": "gpt", "value": "(B) window screen" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018874_653430080391583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, tableware (highlighted by a red box) or tableware (highlighted by a blue box)?\n(A) tableware\n(B) tableware" }, { "from": "gpt", "value": "(A) tableware" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670250_63497117610625_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, table (highlighted by a red box) or table (highlighted by a blue box)?\n(A) table\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115127_84788937578250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, book (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) book\n(B) picture frame" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358700_5162657586291_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from sink (highlighted by a red box)? tap (highlighted by a blue box) or toiletry (highlighted by a green box)?\n(A) tap\n(B) toiletry" }, { "from": "gpt", "value": "(A) tap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895610_469766052800750_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to curtain (highlighted by a red box)? Choose from dresser (highlighted by a blue box) and file cabinet (highlighted by a green box).\n(A) dresser\n(B) file cabinet" }, { "from": "gpt", "value": "(A) dresser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331277_13094345024791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, bottle (highlighted by a red box) or animal (highlighted by a blue box)?\n(A) bottle\n(B) animal" }, { "from": "gpt", "value": "(B) animal" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828596_104228749081958_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from chest of drawers (highlighted by a red box)? Choose from pillow (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899630_229939565073750_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796227_2457413869833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, desk (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) desk\n(B) radiator" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828442_91336130364000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, coffee table (highlighted by a red box) or table (highlighted by a blue box)?\n(A) coffee table\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115424_4973114428500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to bath (highlighted by a red box)? Select from screen door (highlighted by a blue box) and toilet paper (highlighted by a green box).\n(A) screen door\n(B) toilet paper" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331132_174241547874541_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, houseplant (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) houseplant\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331010_181976793695083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, toiletry (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) toiletry\n(B) toiletry" }, { "from": "gpt", "value": "(A) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649399_9675166348708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, fireplace (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) fireplace\n(B) furniture" }, { "from": "gpt", "value": "(A) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332481_338833199520833_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, curtain (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) curtain\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444767_81462871878500_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the window blind (highlighted by a red box)? Choose among these: swivel chair (highlighted by a blue box) or radiator (highlighted by a green box).\n(A) swivel chair\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260891_8639003520750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, soap (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) soap\n(B) electric outlet" }, { "from": "gpt", "value": "(A) soap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898236_167764727821833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from desk (highlighted by a red box)? Choose from chair (highlighted by a blue box) and curtain (highlighted by a green box).\n(A) chair\n(B) curtain" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332562_905906239596041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, umbrella (highlighted by a red box) or door handle (highlighted by a blue box)?\n(A) umbrella\n(B) door handle" }, { "from": "gpt", "value": "(A) umbrella" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897960_216190628919375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, television (highlighted by a red box) or table (highlighted by a blue box)?\n(A) television\n(B) table" }, { "from": "gpt", "value": "(A) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204533_2110925772000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to fireplace (highlighted by a red box), animal (highlighted by a blue box) or mirror (highlighted by a green box)?\n(A) animal\n(B) mirror" }, { "from": "gpt", "value": "(B) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670023_32268602869000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chair (highlighted by a red box) or fruit (highlighted by a blue box)?\n(A) chair\n(B) fruit" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828149_73329398718041_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to tile (highlighted by a red box)? Select from furniture (highlighted by a blue box) and dog bed (highlighted by a green box).\n(A) furniture\n(B) dog bed" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358328_19165065013500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of billiard table (annotated by the red box) in reference to cue? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204304_15100173496583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, magazine (highlighted by a red box) or table (highlighted by a blue box)?\n(A) magazine\n(B) table" }, { "from": "gpt", "value": "(A) magazine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796745_28738070361375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, table (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) table\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663226_66746067796207_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, bottle (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) bottle\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332321_390758968997958_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from stool (highlighted by a red box), round table (highlighted by a blue box) or round table (highlighted by a green box)?\n(A) round table\n(B) round table" }, { "from": "gpt", "value": "(A) round table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358729_6605222899750_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the table (highlighted by a red box)? floral arrangement (highlighted by a blue box) or selfie (highlighted by a green box).\n(A) floral arrangement\n(B) selfie" }, { "from": "gpt", "value": "(A) floral arrangement" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447275_408615600476541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, bay window (highlighted by a red box) or door (highlighted by a blue box)?\n(A) bay window\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898037_222234826840041_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from dish washer (highlighted by a red box)? washing machine (highlighted by a blue box) or glass door (highlighted by a green box)?\n(A) washing machine\n(B) glass door" }, { "from": "gpt", "value": "(A) washing machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444696_72540776745250_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to cabinetry (highlighted by a red box)? faucet (highlighted by a blue box) or cardboard box (highlighted by a green box).\n(A) faucet\n(B) cardboard box" }, { "from": "gpt", "value": "(B) cardboard box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796752_29830766640750_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899489_197728540129750_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from plant (highlighted by a red box)? Choose among these: plant (highlighted by a blue box) or chair (highlighted by a green box).\n(A) plant\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897482_112616749036875_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears farthest from the camera in this image?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458634_127439881291666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, swivel chair (highlighted by a red box) or fireplace (highlighted by a blue box)?\n(A) swivel chair\n(B) fireplace" }, { "from": "gpt", "value": "(B) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899284_885328351663333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, appliance (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332066_250055178406416_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, furniture (highlighted by a red box) or door (highlighted by a blue box)?\n(A) furniture\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260877_7425149005666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, picture frame (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) picture frame\n(B) basket" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739459_51701589914333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to studio couch (highlighted by a red box)? swivel chair (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) swivel chair\n(B) pillow" }, { "from": "gpt", "value": "(A) swivel chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333828_53363457393750_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from cleaning product (highlighted by a red box), cleaning product (highlighted by a blue box) or mouthwash (highlighted by a green box)?\n(A) cleaning product\n(B) mouthwash" }, { "from": "gpt", "value": "(B) mouthwash" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670003_29915978721583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from appliance (highlighted by a red box), cabinetry (highlighted by a blue box) or window (highlighted by a green box)?\n(A) cabinetry\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896482_23940115513000_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to pillow (highlighted by a red box), door (highlighted by a blue box) or desk (highlighted by a green box)?\n(A) door\n(B) desk" }, { "from": "gpt", "value": "(B) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115174_104174749436208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, door (highlighted by a red box) or toilet (highlighted by a blue box)?\n(A) door\n(B) toilet" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739344_46036735015625_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from door (highlighted by a red box)? rail (highlighted by a blue box) or laundry (highlighted by a green box)?\n(A) rail\n(B) laundry" }, { "from": "gpt", "value": "(A) rail" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358225_9581339331583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, curtain (highlighted by a red box) or barn door (highlighted by a blue box)?\n(A) curtain\n(B) barn door" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895593_1161492183237083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to appliance (highlighted by a red box), window sill (highlighted by a blue box) or houseplant (highlighted by a green box)?\n(A) window sill\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334935_663024891952208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261158_688910806333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from window (highlighted by a red box)? Select from bay window (highlighted by a blue box) and curtain (highlighted by a green box).\n(A) bay window\n(B) curtain" }, { "from": "gpt", "value": "(A) bay window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670016_30459984365333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from side table (highlighted by a red box)? toy (highlighted by a blue box) or glass door (highlighted by a green box)?\n(A) toy\n(B) glass door" }, { "from": "gpt", "value": "(B) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458561_128045224444125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, washing machine (highlighted by a red box) or hardwood (highlighted by a blue box)?\n(A) washing machine\n(B) hardwood" }, { "from": "gpt", "value": "(B) hardwood" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895960_133571867645750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, chair (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) chair\n(B) pillow" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430294_187664461128625_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from table (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and furniture (highlighted by a green box).\n(A) picture frame\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739641_2249852137291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, tap (highlighted by a red box) or tap (highlighted by a blue box)?\n(A) tap\n(B) tap" }, { "from": "gpt", "value": "(A) tap" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898587_184463773164416_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from pillow (highlighted by a red box)? glass door (highlighted by a blue box) or table (highlighted by a green box)?\n(A) glass door\n(B) table" }, { "from": "gpt", "value": "(A) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358362_16274162109916_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358278_9008914782958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from picture frame (highlighted by a red box)? Choose among these: screen door (highlighted by a blue box) or tableware (highlighted by a green box).\n(A) screen door\n(B) tableware" }, { "from": "gpt", "value": "(B) tableware" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332473_886534176029541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896469_21810093818583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from stairwell (highlighted by a red box)? Choose from toilet bowl (highlighted by a blue box) and screen door (highlighted by a green box).\n(A) toilet bowl\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430677_326576078053958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of chair (annotated by the red box) and table in the image provided, where is chair (annotated by the red box) located with respect to the staircase? Select from the following choices.\"\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334001_51176142217041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669896_11035796806250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, cabinetry (highlighted by a red box) or faucet (highlighted by a blue box)?\n(A) cabinetry\n(B) faucet" }, { "from": "gpt", "value": "(B) faucet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430983_101545527368500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, furniture (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) furniture\n(B) mat" }, { "from": "gpt", "value": "(B) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331378_198315089651250_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from toy (highlighted by a red box)? Choose among these: toy (highlighted by a blue box) or blanket (highlighted by a green box).\n(A) toy\n(B) blanket" }, { "from": "gpt", "value": "(B) blanket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261289_15910358182625_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, toy (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) toy\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430298_187439152478166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, book (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) book\n(B) shelf" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430982_101696532707291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, shelf (highlighted by a red box) or shelf (highlighted by a blue box)?\n(A) shelf\n(B) shelf" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739276_42787460235541_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, desk (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) desk\n(B) mat" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662870_14522378671625_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, table (highlighted by a red box) or window (highlighted by a blue box)?\n(A) table\n(B) window" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895962_406759191539791_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, table (highlighted by a red box) or bean bag chair (highlighted by a blue box)?\n(A) table\n(B) bean bag chair" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899030_643062570958083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from toy (highlighted by a red box)? Choose from pillow (highlighted by a blue box) and chair (highlighted by a green box).\n(A) pillow\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445476_152285786811125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is door (annotated by the red box) located relative to table? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018552_830391421915166_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to candle holder (highlighted by a red box)? clock (highlighted by a blue box) or chest of drawers (highlighted by a green box).\n(A) clock\n(B) chest of drawers" }, { "from": "gpt", "value": "(A) clock" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446485_355746355181375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, furniture (highlighted by a red box) or dog bed (highlighted by a blue box)?\n(A) furniture\n(B) dog bed" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332812_48061930383041_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, cardboard box (highlighted by a red box) or journal (highlighted by a blue box)?\n(A) cardboard box\n(B) journal" }, { "from": "gpt", "value": "(B) journal" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333268_21924313040625_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, oven (highlighted by a red box) or basket (highlighted by a blue box)?\n(A) oven\n(B) basket" }, { "from": "gpt", "value": "(B) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332810_48190827670958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from cleaning product (highlighted by a red box)? Choose from window (highlighted by a blue box) and bottle (highlighted by a green box).\n(A) window\n(B) bottle" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458202_74751063771958_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther to the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331148_179367090318791_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, chest of drawers (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) chest of drawers\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897818_132722689125166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, lamp (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) lamp\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898261_697064526878083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, lamp (highlighted by a red box) or table (highlighted by a blue box)?\n(A) lamp\n(B) table" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331589_15953278112166_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from animal (highlighted by a red box), book (highlighted by a blue box) or book (highlighted by a green box)?\n(A) book\n(B) book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796366_10526439161666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from stool (highlighted by a red box), table (highlighted by a blue box) or fireplace (highlighted by a green box)?\n(A) table\n(B) fireplace" }, { "from": "gpt", "value": "(B) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204820_28635215850666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from bookcase (highlighted by a red box)? furniture (highlighted by a blue box) or window (highlighted by a green box)?\n(A) furniture\n(B) window" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115227_95962836163625_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, remote (highlighted by a red box) or remote (highlighted by a blue box)?\n(A) remote\n(B) remote" }, { "from": "gpt", "value": "(B) remote" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899060_648290548222958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, sink (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) sink\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899489_197732555134833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, toilet (highlighted by a red box) or changing table (highlighted by a blue box)?\n(A) toilet\n(B) changing table" }, { "from": "gpt", "value": "(A) toilet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796568_16185679410416_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the pillow (highlighted by a red box)? Choose among these: pillow (highlighted by a blue box) or table (highlighted by a green box).\n(A) pillow\n(B) table" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446446_82376119184458_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to oven (highlighted by a red box)? Select from coffee machine (highlighted by a blue box) and drawer (highlighted by a green box).\n(A) coffee machine\n(B) drawer" }, { "from": "gpt", "value": "(B) drawer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331942_164717518188833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from door (highlighted by a red box)? plant (highlighted by a blue box) or door (highlighted by a green box)?\n(A) plant\n(B) door" }, { "from": "gpt", "value": "(A) plant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670244_63613302809583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, footwear (highlighted by a red box) or shoe (highlighted by a blue box)?\n(A) footwear\n(B) shoe" }, { "from": "gpt", "value": "(B) shoe" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204291_14432091462041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to laundry (highlighted by a red box)? material (highlighted by a blue box) or laundry (highlighted by a green box).\n(A) material\n(B) laundry" }, { "from": "gpt", "value": "(B) laundry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898984_824366785406625_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739740_3736102193833_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from pillow (highlighted by a red box)? shelf (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) shelf\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446057_79919956392208_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to passage (highlighted by a red box)? Choose from path (highlighted by a blue box) and curtain (highlighted by a green box).\n(A) path\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445613_56619815690291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, pillow (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) pillow\n(B) pillow" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828449_91301227550250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, picture frame (highlighted by a red box) or bed (highlighted by a blue box)?\n(A) picture frame\n(B) bed" }, { "from": "gpt", "value": "(B) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663322_77643667649833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from window screen (highlighted by a red box)? Select from table (highlighted by a blue box) and window (highlighted by a green box).\n(A) table\n(B) window" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898984_824247401198000_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, pillow (highlighted by a red box) or sheet (highlighted by a blue box)?\n(A) pillow\n(B) sheet" }, { "from": "gpt", "value": "(B) sheet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669948_15362236270333_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from television (highlighted by a red box)? chest of drawers (highlighted by a blue box) or houseplant (highlighted by a green box)?\n(A) chest of drawers\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828493_101864292215041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, cabinetry (highlighted by a red box) or home appliance (highlighted by a blue box)?\n(A) cabinetry\n(B) home appliance" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333665_131866205385375_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898586_184274181565916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhere is chair (annotated by the red box) located in relation to tray in the image?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261294_16240841427291_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to shutter (highlighted by a red box)? Choose from window sill (highlighted by a blue box) and swivel chair (highlighted by a green box).\n(A) window sill\n(B) swivel chair" }, { "from": "gpt", "value": "(A) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662995_30713595779083_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from hole (highlighted by a red box)? Choose among these: bath (highlighted by a blue box) or shower (highlighted by a green box).\n(A) bath\n(B) shower" }, { "from": "gpt", "value": "(A) bath" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899236_880490331906500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, furniture (highlighted by a red box) or balloon (highlighted by a blue box)?\n(A) furniture\n(B) balloon" }, { "from": "gpt", "value": "(B) balloon" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662806_13578879085500_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to side table (highlighted by a red box)? Select from window screen (highlighted by a blue box) and table (highlighted by a green box).\n(A) window screen\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739680_580306931958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, person (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) person\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48017998_458310220934500_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from stool (highlighted by a red box), stool (highlighted by a blue box) or vegetation (highlighted by a green box)?\n(A) stool\n(B) vegetation" }, { "from": "gpt", "value": "(B) vegetation" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896358_18593407401416_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895797_680636395230875_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the picture frame (highlighted by a red box)? Choose among these: picture frame (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334621_385433924888916_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from pillow (highlighted by a red box)? radiator (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) radiator\n(B) pillow" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115394_3352861593208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of cabinetry (annotated by the red box) in reference to tomato?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896063_132116990520833_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to magazine (highlighted by a red box)? Select from cardboard box (highlighted by a blue box) and glass door (highlighted by a green box).\n(A) cardboard box\n(B) glass door" }, { "from": "gpt", "value": "(B) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649639_39687449748125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, oven (highlighted by a red box) or beach towel (highlighted by a blue box)?\n(A) oven\n(B) beach towel" }, { "from": "gpt", "value": "(B) beach towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332044_207165383715750_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, furniture (highlighted by a red box) or bronze statue (highlighted by a blue box)?\n(A) furniture\n(B) bronze statue" }, { "from": "gpt", "value": "(B) bronze statue" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458260_74307042943166_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from chair (highlighted by a red box)? Choose from book (highlighted by a blue box) and book (highlighted by a green box).\n(A) book\n(B) book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739426_191882605017291_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to sculpture (highlighted by a red box)? Choose from window (highlighted by a blue box) and giraffe (highlighted by a green box).\n(A) window\n(B) giraffe" }, { "from": "gpt", "value": "(B) giraffe" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897720_114154638243250_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430251_182233989572333_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, computer monitor (highlighted by a red box) or remote (highlighted by a blue box)?\n(A) computer monitor\n(B) remote" }, { "from": "gpt", "value": "(B) remote" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261569_76327334643666_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from home appliance (highlighted by a red box)? Choose among these: cabinetry (highlighted by a blue box) or glass box (highlighted by a green box).\n(A) cabinetry\n(B) glass box" }, { "from": "gpt", "value": "(B) glass box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670134_39910569149083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, bath towel (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) bath towel\n(B) toiletry" }, { "from": "gpt", "value": "(A) bath towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895587_1160113029854791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, picture frame (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) picture frame\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828340_78903432608208_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, studio couch (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) studio couch\n(B) pillow" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334958_667546376971958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, book (highlighted by a red box) or paperback book (highlighted by a blue box)?\n(A) book\n(B) paperback book" }, { "from": "gpt", "value": "(B) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897409_102977183281083_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, cabinetry (highlighted by a red box) or microwave oven (highlighted by a blue box)?\n(A) cabinetry\n(B) microwave oven" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444754_80981157649708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from document (highlighted by a red box)? control (highlighted by a blue box) or furniture (highlighted by a green box)?\n(A) control\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739414_191345566684083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from table lamp (highlighted by a red box), stool (highlighted by a blue box) or writing desk (highlighted by a green box)?\n(A) stool\n(B) writing desk" }, { "from": "gpt", "value": "(A) stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115304_119544224502125_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to window (highlighted by a red box)? Choose from person (highlighted by a blue box) and door (highlighted by a green box).\n(A) person\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334147_142777234060875_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from cabinetry (highlighted by a red box)? Choose among these: book (highlighted by a blue box) or shelf (highlighted by a green box).\n(A) book\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445955_130078442623458_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from pillow (highlighted by a red box)? studio couch (highlighted by a blue box) or footrest (highlighted by a green box)?\n(A) studio couch\n(B) footrest" }, { "from": "gpt", "value": "(B) footrest" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828504_102354067849541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to footwear (highlighted by a red box)? chair (highlighted by a blue box) or footwear (highlighted by a green box).\n(A) chair\n(B) footwear" }, { "from": "gpt", "value": "(B) footwear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899202_186812872029916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chair (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) chair\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649399_9599163079916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, bed (highlighted by a red box) or footwear (highlighted by a blue box)?\n(A) bed\n(B) footwear" }, { "from": "gpt", "value": "(B) footwear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261686_3791952183875_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from picture frame (highlighted by a red box)? Choose from pillow (highlighted by a blue box) and clothing (highlighted by a green box).\n(A) pillow\n(B) clothing" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358168_61072035755500_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from picture frame (highlighted by a red box), coffee table (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) coffee table\n(B) picture frame" }, { "from": "gpt", "value": "(A) coffee table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429728_19241329575958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to toiletry (highlighted by a red box)? Choose from notepad (highlighted by a blue box) and desk (highlighted by a green box).\n(A) notepad\n(B) desk" }, { "from": "gpt", "value": "(A) notepad" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334459_100790195957125_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261289_15896363712708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, door (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) door\n(B) pillow" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898448_3286284652500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, cleaning product (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) cleaning product\n(B) bottle" }, { "from": "gpt", "value": "(A) cleaning product" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430442_714455890083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, table (highlighted by a red box) or meal (highlighted by a blue box)?\n(A) table\n(B) meal" }, { "from": "gpt", "value": "(B) meal" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260952_6038294556250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, curtain (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) curtain\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896247_7591091263958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, light fixture (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) light fixture\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663255_74980370300333_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018334_116216998511958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from swivel chair (highlighted by a red box)? Choose among these: appliance (highlighted by a blue box) or cabinetry (highlighted by a green box).\n(A) appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430795_60892068511333_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, furniture (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) furniture\n(B) furniture" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331771_8440617074207_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333785_48913968165166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, glass jar (highlighted by a red box) or kitchen appliance (highlighted by a blue box)?\n(A) glass jar\n(B) kitchen appliance" }, { "from": "gpt", "value": "(B) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896252_7998939316250_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from cleaning product (highlighted by a red box)? Choose among these: bathroom cabinet (highlighted by a blue box) or tap (highlighted by a green box).\n(A) bathroom cabinet\n(B) tap" }, { "from": "gpt", "value": "(A) bathroom cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47330990_177125086962250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, dresser (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) dresser\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331627_20070032053916_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from oven (highlighted by a red box)? Choose from kitchen appliance (highlighted by a blue box) and pot/pan (highlighted by a green box).\n(A) kitchen appliance\n(B) pot/pan" }, { "from": "gpt", "value": "(B) pot/pan" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429870_14324572781750_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334615_385597624935833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chair (highlighted by a red box) or tray (highlighted by a blue box)?\n(A) chair\n(B) tray" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115129_85569045214708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to sink (highlighted by a red box)? bottle (highlighted by a blue box) or bathtub (highlighted by a green box).\n(A) bottle\n(B) bathtub" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115227_95910741197333_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the farthest from the observer?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260952_6026299299083_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the door (highlighted by a red box)? Choose among these: furniture (highlighted by a blue box) or mirror (highlighted by a green box).\n(A) furniture\n(B) mirror" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430828_67800259767041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, lamp (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) lamp\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895911_111560848373541_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to basket container (highlighted by a red box)? Choose from basket container (highlighted by a blue box) and basket (highlighted by a green box).\n(A) basket container\n(B) basket" }, { "from": "gpt", "value": "(B) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430808_64026194218875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, window (highlighted by a red box) or mat (highlighted by a blue box)?\n(A) window\n(B) mat" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331133_175746031690958_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the bath towel (highlighted by a red box)? Choose among these: toiletry (highlighted by a blue box) or sink (highlighted by a green box).\n(A) toiletry\n(B) sink" }, { "from": "gpt", "value": "(A) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261281_14384851325791_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358268_7163460711750_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from countertop (highlighted by a red box)? Select from appliance (highlighted by a blue box) and appliance (highlighted by a green box).\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897480_471006924863166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to chair (highlighted by a red box)? Choose from chair (highlighted by a blue box) and curtain (highlighted by a green box).\n(A) chair\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332557_904952564363583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, cardboard box (highlighted by a red box) or waste container (highlighted by a blue box)?\n(A) cardboard box\n(B) waste container" }, { "from": "gpt", "value": "(A) cardboard box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333292_26342831171500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of plywood (annotated by the red box) in relation to plywood? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446495_357653032263166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, toiletry (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) toiletry\n(B) toiletry" }, { "from": "gpt", "value": "(A) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331365_195092681153916_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, bed (highlighted by a red box) or nightstand (highlighted by a blue box)?\n(A) bed\n(B) nightstand" }, { "from": "gpt", "value": "(B) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444574_31871795199125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, cabinetry (highlighted by a red box) or kitchen appliance (highlighted by a blue box)?\n(A) cabinetry\n(B) kitchen appliance" }, { "from": "gpt", "value": "(B) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458286_76240030732916_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from curtain (highlighted by a red box)? Choose among these: light fixture (highlighted by a blue box) or curtain (highlighted by a green box).\n(A) light fixture\n(B) curtain" }, { "from": "gpt", "value": "(A) light fixture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895868_107566775389041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from book (highlighted by a red box)? studio couch (highlighted by a blue box) or book (highlighted by a green box)?\n(A) studio couch\n(B) book" }, { "from": "gpt", "value": "(A) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898052_223255122217708_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, table lamp (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) table lamp\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358220_9338056825375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, door (highlighted by a red box) or door (highlighted by a blue box)?\n(A) door\n(B) door" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261339_23913449218500_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from toaster (highlighted by a red box)? Choose from home appliance (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) home appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(A) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334213_105846988659375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, chair (highlighted by a red box) or desk (highlighted by a blue box)?\n(A) chair\n(B) desk" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895860_489209566155208_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669927_14216969279708_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to desk (highlighted by a red box)? book (highlighted by a blue box) or shelf (highlighted by a green box).\n(A) book\n(B) shelf" }, { "from": "gpt", "value": "(B) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662950_24238426162041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the shoe (highlighted by a red box)? Choose among these: shoe (highlighted by a blue box) or shoe (highlighted by a green box).\n(A) shoe\n(B) shoe" }, { "from": "gpt", "value": "(A) shoe" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828393_94637896281208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is lamp (annotated by the red box) located in relation to window in the image? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796210_1410856395916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, curtain (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) curtain\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018872_653529190250500_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which of the following is the closest to the observer?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896247_7615081306583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, tripod (highlighted by a red box) or door (highlighted by a blue box)?\n(A) tripod\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445799_67035808594375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, teddy bear (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) teddy bear\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897455_469647461119125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, table (highlighted by a red box) or coffee table (highlighted by a blue box)?\n(A) table\n(B) coffee table" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430246_182485587743083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, desk (highlighted by a red box) or swivel chair (highlighted by a blue box)?\n(A) desk\n(B) swivel chair" }, { "from": "gpt", "value": "(B) swivel chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828554_101407017083666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from fridge (highlighted by a red box)? Choose from poster (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) poster\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897871_341003482290083_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to light switch (highlighted by a red box)? light switch (highlighted by a blue box) or light switch (highlighted by a green box).\n(A) light switch\n(B) light switch" }, { "from": "gpt", "value": "(A) light switch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261172_1500060765333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from chair (highlighted by a red box), round table (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) round table\n(B) chair" }, { "from": "gpt", "value": "(A) round table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334887_622572385033833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the bed (highlighted by a red box)? bed (highlighted by a blue box) or pillow (highlighted by a green box).\n(A) bed\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261382_26776705116833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, electric outlet (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) electric outlet\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018760_15065350668916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to window (highlighted by a red box)? Select from houseplant (highlighted by a blue box) and houseplant (highlighted by a green box).\n(A) houseplant\n(B) houseplant" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444791_51711072033333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of towel (annotated by the red box) in relation to door handle?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430236_181819975098791_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to mouthwash (highlighted by a red box), product (highlighted by a blue box) or shaving cream (highlighted by a green box)?\n(A) product\n(B) shaving cream" }, { "from": "gpt", "value": "(B) shaving cream" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828311_76432531650208_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the table (highlighted by a red box)? Choose among these: mat (highlighted by a blue box) or table (highlighted by a green box).\n(A) mat\n(B) table" }, { "from": "gpt", "value": "(A) mat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204376_18213724714208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, clock (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) clock\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018025_459862848839916_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from sticker (highlighted by a red box)? Choose from sticker (highlighted by a blue box) and refrigerator (highlighted by a green box).\n(A) sticker\n(B) refrigerator" }, { "from": "gpt", "value": "(A) sticker" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897560_473401194419250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chair (highlighted by a red box) or file cabinet (highlighted by a blue box)?\n(A) chair\n(B) file cabinet" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332398_401529416410541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from cabinetry (highlighted by a red box)? home appliance (highlighted by a blue box) or cabinetry (highlighted by a green box)?\n(A) home appliance\n(B) cabinetry" }, { "from": "gpt", "value": "(A) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458202_74733071223666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from window sill (highlighted by a red box)? curtain (highlighted by a blue box) or pillow (highlighted by a green box)?\n(A) curtain\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897653_147009673915166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, table (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) table\n(B) appliance" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458225_76827772701208_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the drum (highlighted by a red box)? guitar (highlighted by a blue box) or radiator (highlighted by a green box).\n(A) guitar\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896009_137114268028291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, table lamp (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) table lamp\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895908_110730948339333_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, bed (highlighted by a red box) or nightstand (highlighted by a blue box)?\n(A) bed\n(B) nightstand" }, { "from": "gpt", "value": "(B) nightstand" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333778_48285635229541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from book (highlighted by a red box)? Select from window sill (highlighted by a blue box) and book (highlighted by a green box).\n(A) window sill\n(B) book" }, { "from": "gpt", "value": "(A) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895637_471651393486875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, lamp (highlighted by a red box) or couch (highlighted by a blue box)?\n(A) lamp\n(B) couch" }, { "from": "gpt", "value": "(B) couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332954_21989994445333_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, cabinetry (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) cabinetry\n(B) cabinetry" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897804_131482416513333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, chair (highlighted by a red box) or table (highlighted by a blue box)?\n(A) chair\n(B) table" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898959_821211706628166_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from electric outlet (highlighted by a red box), projection screen (highlighted by a blue box) or microwave oven (highlighted by a green box)?\n(A) projection screen\n(B) microwave oven" }, { "from": "gpt", "value": "(B) microwave oven" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260938_4890193844666_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from chair (highlighted by a red box), bowl (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) bowl\n(B) chair" }, { "from": "gpt", "value": "(A) bowl" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444719_75442772351208_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898903_817107129024291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, floral arrangement (highlighted by a red box) or bar stool (highlighted by a blue box)?\n(A) floral arrangement\n(B) bar stool" }, { "from": "gpt", "value": "(B) bar stool" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430858_74457487859458_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, furniture (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) furniture\n(B) toiletry" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204780_27250969355000_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, trash bin/can (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) trash bin/can\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261313_22291850443958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, chair (highlighted by a red box) or radiator (highlighted by a blue box)?\n(A) chair\n(B) radiator" }, { "from": "gpt", "value": "(B) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649707_47651751582375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, chair (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) chair\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333277_24345808601541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the window screen (highlighted by a red box)? Choose among these: picture frame (highlighted by a blue box) or picture frame (highlighted by a green box).\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663332_77451164330583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, window (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) window\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333195_46980039379958_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, cabinetry (highlighted by a red box) or window (highlighted by a blue box)?\n(A) cabinetry\n(B) window" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429799_737751027439208_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, furniture (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) furniture\n(B) appliance" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796691_30624349597458_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to picture frame (highlighted by a red box), clothing (highlighted by a blue box) or pants (highlighted by a green box)?\n(A) clothing\n(B) pants" }, { "from": "gpt", "value": "(A) clothing" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663053_38623396611791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chair (highlighted by a red box) or exhaust hood (highlighted by a blue box)?\n(A) chair\n(B) exhaust hood" }, { "from": "gpt", "value": "(B) exhaust hood" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429774_360109524117458_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera taking this photo?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(A) A is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898419_1191040967625_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from window sill (highlighted by a red box)? curtain (highlighted by a blue box) or fireplace (highlighted by a green box)?\n(A) curtain\n(B) fireplace" }, { "from": "gpt", "value": "(B) fireplace" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458219_76171334267208_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from table (highlighted by a red box), balustrade (highlighted by a blue box) or mirror (highlighted by a green box)?\n(A) balustrade\n(B) mirror" }, { "from": "gpt", "value": "(B) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458221_76866973124041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, door (highlighted by a red box) or desk (highlighted by a blue box)?\n(A) door\n(B) desk" }, { "from": "gpt", "value": "(B) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445173_8217923432250_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from toaster (highlighted by a red box)? table lamp (highlighted by a blue box) or curtain (highlighted by a green box)?\n(A) table lamp\n(B) curtain" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670295_63446238910041_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from bulletin board (highlighted by a red box)? Select from vase (highlighted by a blue box) and desktop (highlighted by a green box).\n(A) vase\n(B) desktop" }, { "from": "gpt", "value": "(A) vase" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260895_8752706323625_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to bottle (highlighted by a red box)? bathtub (highlighted by a blue box) or bath mat (highlighted by a green box).\n(A) bathtub\n(B) bath mat" }, { "from": "gpt", "value": "(A) bathtub" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444695_72648582814083_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of furniture (annotated by the red box) in relation to television? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260892_8819511885000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, balustrade (highlighted by a red box) or bath (highlighted by a blue box)?\n(A) balustrade\n(B) bath" }, { "from": "gpt", "value": "(A) balustrade" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662891_19485502951583_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, treadmill (highlighted by a red box) or projection screen (highlighted by a blue box)?\n(A) treadmill\n(B) projection screen" }, { "from": "gpt", "value": "(A) treadmill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332158_260219734768833_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, furniture (highlighted by a red box) or wrapping paper (highlighted by a blue box)?\n(A) furniture\n(B) wrapping paper" }, { "from": "gpt", "value": "(A) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358234_9894761924041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, electric outlet (highlighted by a red box) or concrete (highlighted by a blue box)?\n(A) electric outlet\n(B) concrete" }, { "from": "gpt", "value": "(B) concrete" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899284_885332366660541_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, picture frame (highlighted by a red box) or bottle (highlighted by a blue box)?\n(A) picture frame\n(B) bottle" }, { "from": "gpt", "value": "(B) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458219_76155340886166_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from radiator (highlighted by a red box)? lamp (highlighted by a blue box) or cardboard box (highlighted by a green box)?\n(A) lamp\n(B) cardboard box" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429804_737623828705583_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to bottle (highlighted by a red box)? Choose from home appliance (highlighted by a blue box) and kitchen appliance (highlighted by a green box).\n(A) home appliance\n(B) kitchen appliance" }, { "from": "gpt", "value": "(B) kitchen appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429764_358138651640791_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, pad (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) pad\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358386_19178753446458_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to chair (highlighted by a red box)? Choose from curtain (highlighted by a blue box) and curtain (highlighted by a green box).\n(A) curtain\n(B) curtain" }, { "from": "gpt", "value": "(A) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445869_71889585623500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, candle holder (highlighted by a red box) or candle holder (highlighted by a blue box)?\n(A) candle holder\n(B) candle holder" }, { "from": "gpt", "value": "(A) candle holder" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897863_340968280012125_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the curtain (highlighted by a red box)? light (highlighted by a blue box) or bay window (highlighted by a green box).\n(A) light\n(B) bay window" }, { "from": "gpt", "value": "(B) bay window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898621_757980813430500_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to countertop (highlighted by a red box)? Select from appliance (highlighted by a blue box) and appliance (highlighted by a green box).\n(A) appliance\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899654_233428274193916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the picture frame (highlighted by a red box)? Choose among these: door (highlighted by a blue box) or curtain (highlighted by a green box).\n(A) door\n(B) curtain" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458633_127562282865333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, remote (highlighted by a red box) or table (highlighted by a blue box)?\n(A) remote\n(B) table" }, { "from": "gpt", "value": "(A) remote" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899513_197637044677416_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, table (highlighted by a red box) or lamp (highlighted by a blue box)?\n(A) table\n(B) lamp" }, { "from": "gpt", "value": "(B) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898458_156625693934375_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261251_12649495729500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, studio couch (highlighted by a red box) or table (highlighted by a blue box)?\n(A) studio couch\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429799_737872528382833_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to table (highlighted by a red box)? Choose from couch (highlighted by a blue box) and table (highlighted by a green box).\n(A) couch\n(B) table" }, { "from": "gpt", "value": "(A) couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332705_109838912975958_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, door (highlighted by a red box) or clothing (highlighted by a blue box)?\n(A) door\n(B) clothing" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204856_1705124030583_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897870_529950969698875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, desk (highlighted by a red box) or houseplant (highlighted by a blue box)?\n(A) desk\n(B) houseplant" }, { "from": "gpt", "value": "(A) desk" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739276_42833474471958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, paperback book (highlighted by a red box) or book (highlighted by a blue box)?\n(A) paperback book\n(B) book" }, { "from": "gpt", "value": "(A) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018608_633230515300791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from bottle (highlighted by a red box)? television (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) television\n(B) chair" }, { "from": "gpt", "value": "(A) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444579_32085808214125_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the kitchen appliance (highlighted by a red box)? Choose among these: appliance (highlighted by a blue box) or coffee table (highlighted by a green box).\n(A) appliance\n(B) coffee table" }, { "from": "gpt", "value": "(A) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899632_229990161662916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, blanket (highlighted by a red box) or concrete (highlighted by a blue box)?\n(A) blanket\n(B) concrete" }, { "from": "gpt", "value": "(A) blanket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333292_26405039017500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of towel (annotated by the red box) in relation to towel? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(A) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204335_15098407465958_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, nightstand (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) nightstand\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445585_283538767274416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, nightstand (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) nightstand\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204739_24143838895291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, chest of drawers (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) chest of drawers\n(B) table lamp" }, { "from": "gpt", "value": "(B) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897755_117594114884125_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the book (highlighted by a red box)? Choose among these: stove (highlighted by a blue box) or book (highlighted by a green box).\n(A) stove\n(B) book" }, { "from": "gpt", "value": "(A) stove" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446142_140940263475916_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from storage box (highlighted by a red box)? cardboard box (highlighted by a blue box) or table (highlighted by a green box)?\n(A) cardboard box\n(B) table" }, { "from": "gpt", "value": "(A) cardboard box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430236_181830470829250_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhere is curtain (annotated by the red box) located in relation to curtain in the image?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333603_75417376560833_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444787_50386308077666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the microwave oven (highlighted by a red box)? Choose among these: cabinetry (highlighted by a blue box) or window screen (highlighted by a green box).\n(A) cabinetry\n(B) window screen" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018445_526692195914124_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, light (highlighted by a red box) or window (highlighted by a blue box)?\n(A) light\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333659_130350371977291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, bookcase (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) bookcase\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796463_3631707081166_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to bottle (highlighted by a red box), cleaning product (highlighted by a blue box) or bathtub (highlighted by a green box)?\n(A) cleaning product\n(B) bathtub" }, { "from": "gpt", "value": "(B) bathtub" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115240_97896869121375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of table (annotated by the red box) in reference to studio couch? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796446_607714962333_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(A) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739646_2224146105166_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, chest of drawers (highlighted by a red box) or gift box (highlighted by a blue box)?\n(A) chest of drawers\n(B) gift box" }, { "from": "gpt", "value": "(B) gift box" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358170_62318534317750_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from houseplant (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and door (highlighted by a green box).\n(A) picture frame\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204876_3590337920666_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from toilet (highlighted by a red box)? toilet paper (highlighted by a blue box) or toilet paper (highlighted by a green box)?\n(A) toilet paper\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670299_63496735611750_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the furniture (highlighted by a red box)? light switch (highlighted by a blue box) or door (highlighted by a green box).\n(A) light switch\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895871_489442484355958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from cabinetry (highlighted by a red box)? Choose from coffee cup (highlighted by a blue box) and electric outlet (highlighted by a green box).\n(A) coffee cup\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896009_137132260528249_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, lamp (highlighted by a red box) or table (highlighted by a blue box)?\n(A) lamp\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261541_74313723331875_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from christmas tree (highlighted by a red box)? Select from mirror (highlighted by a blue box) and toy (highlighted by a green box).\n(A) mirror\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204741_25164088478125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, picture frame (highlighted by a red box) or picture frame (highlighted by a blue box)?\n(A) picture frame\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796475_4324732897500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to table (highlighted by a red box)? Choose from remote control (highlighted by a blue box) and pillow (highlighted by a green box).\n(A) remote control\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828320_76191726910125_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, television (highlighted by a red box) or plain (highlighted by a blue box)?\n(A) television\n(B) plain" }, { "from": "gpt", "value": "(A) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261713_1482731099250_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is farther from the camera taking this photo?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896083_144021894174208_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to window screen (highlighted by a red box), pillow (highlighted by a blue box) or window (highlighted by a green box)?\n(A) pillow\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898958_821335289387500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from electric outlet (highlighted by a red box)? home appliance (highlighted by a blue box) or appliance (highlighted by a green box)?\n(A) home appliance\n(B) appliance" }, { "from": "gpt", "value": "(A) home appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204724_23546527298083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, chair (highlighted by a red box) or couch (highlighted by a blue box)?\n(A) chair\n(B) couch" }, { "from": "gpt", "value": "(B) couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895449_129287091245333_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the toothbrush (highlighted by a red box)? mouthwash (highlighted by a blue box) or mouthwash (highlighted by a green box).\n(A) mouthwash\n(B) mouthwash" }, { "from": "gpt", "value": "(B) mouthwash" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018331_116127101421458_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to furniture (highlighted by a red box)? Select from handbag (highlighted by a blue box) and concrete (highlighted by a green box).\n(A) handbag\n(B) concrete" }, { "from": "gpt", "value": "(B) concrete" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333493_62527689660333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to curtain (highlighted by a red box)? balloon (highlighted by a blue box) or curtain (highlighted by a green box).\n(A) balloon\n(B) curtain" }, { "from": "gpt", "value": "(A) balloon" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445040_1753443563041_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from person (highlighted by a red box)? Select from fireplace (highlighted by a blue box) and table (highlighted by a green box).\n(A) fireplace\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896247_7601087115791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from picture frame (highlighted by a red box)? Select from shelf (highlighted by a blue box) and bed (highlighted by a green box).\n(A) shelf\n(B) bed" }, { "from": "gpt", "value": "(A) shelf" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796752_29852757944583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, curtain (highlighted by a red box) or window (highlighted by a blue box)?\n(A) curtain\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333657_130120981798833_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, toy (highlighted by a red box) or toy (highlighted by a blue box)?\n(A) toy\n(B) toy" }, { "from": "gpt", "value": "(B) toy" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115299_119565132903000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from shelf (highlighted by a red box), curtain (highlighted by a blue box) or bay window (highlighted by a green box)?\n(A) curtain\n(B) bay window" }, { "from": "gpt", "value": "(B) bay window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897587_134961353164583_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer, lamp (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) lamp\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445619_56382414040666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, home appliance (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) home appliance\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204305_15290277772750_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the book (highlighted by a red box)? Choose among these: table (highlighted by a blue box) or magazine (highlighted by a green box).\n(A) table\n(B) magazine" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796492_1614072194333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from chair (highlighted by a red box), changing table (highlighted by a blue box) or cupboard (highlighted by a green box)?\n(A) changing table\n(B) cupboard" }, { "from": "gpt", "value": "(B) cupboard" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42447216_212551024623000_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, cabinetry (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) cabinetry\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670299_63484740353625_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, computer monitor (highlighted by a red box) or power outlet (highlighted by a blue box)?\n(A) computer monitor\n(B) power outlet" }, { "from": "gpt", "value": "(A) computer monitor" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204342_14923709890041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, picture frame (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) picture frame\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333873_76255375547583_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to furniture (highlighted by a red box), window (highlighted by a blue box) or window (highlighted by a green box)?\n(A) window\n(B) window" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649397_9467265237041_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the curtain (highlighted by a red box)? Choose among these: fireplace (highlighted by a blue box) or basket (highlighted by a green box).\n(A) fireplace\n(B) basket" }, { "from": "gpt", "value": "(B) basket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334628_386202135008708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from paper towel (highlighted by a red box)? wide (highlighted by a blue box) or waste (highlighted by a green box)?\n(A) wide\n(B) waste" }, { "from": "gpt", "value": "(B) waste" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204741_25194092722458_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to studio couch (highlighted by a red box)? pad (highlighted by a blue box) or table (highlighted by a green box).\n(A) pad\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332778_44592060170333_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, houseplant (highlighted by a red box) or wall clock (highlighted by a blue box)?\n(A) houseplant\n(B) wall clock" }, { "from": "gpt", "value": "(B) wall clock" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430217_180353208534000_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from shelf (highlighted by a red box)? Select from Eiffel tower (highlighted by a blue box) and book (highlighted by a green box).\n(A) Eiffel tower\n(B) book" }, { "from": "gpt", "value": "(A) Eiffel tower" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333298_26668430409291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, bath (highlighted by a red box) or bath towel (highlighted by a blue box)?\n(A) bath\n(B) bath towel" }, { "from": "gpt", "value": "(B) bath towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334655_389738641995041_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is toilet paper (annotated by the red box) located relative to toilet paper? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333674_134265756341583_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears farthest from the camera in this image?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332503_343984977754666_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from shelf (highlighted by a red box)? Select from table (highlighted by a blue box) and shelf (highlighted by a green box).\n(A) table\n(B) shelf" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796721_27323875295708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from window (highlighted by a red box), cabinetry (highlighted by a blue box) or picture frame (highlighted by a green box)?\n(A) cabinetry\n(B) picture frame" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332015_200858351329750_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is closer to the camera?\nSelect from the following choices.\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458337_102864722129875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, cabinetry (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) cabinetry\n(B) cabinetry" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45260889_8625509114166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial relationship of light fixture (annotated by the red box) in relation to plank? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(A) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897948_351394212943708_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, remote control (highlighted by a red box) or coffee cup (highlighted by a blue box)?\n(A) remote control\n(B) coffee cup" }, { "from": "gpt", "value": "(B) coffee cup" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42897709_111984306444875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, cabinetry (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) cabinetry\n(B) cabinetry" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331080_133682683026958_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from couch (highlighted by a red box)? houseplant (highlighted by a blue box) or houseplant (highlighted by a green box)?\n(A) houseplant\n(B) houseplant" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333838_54192779768916_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from table (highlighted by a red box)? Select from beverage (highlighted by a blue box) and picture frame (highlighted by a green box).\n(A) beverage\n(B) picture frame" }, { "from": "gpt", "value": "(B) picture frame" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896209_2281375788875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, countertop (highlighted by a red box) or door (highlighted by a blue box)?\n(A) countertop\n(B) door" }, { "from": "gpt", "value": "(A) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018776_15388991376875_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, where is shower door (annotated by the red box) located relative to screen door? Select from the following\n(A) below\n(B) above" }, { "from": "gpt", "value": "(B) above" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331945_165252130957416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, door (highlighted by a red box) or vanity (highlighted by a blue box)?\n(A) door\n(B) vanity" }, { "from": "gpt", "value": "(B) vanity" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334900_1084406241318041_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, person (highlighted by a red box) or beach towel (highlighted by a blue box)?\n(A) person\n(B) beach towel" }, { "from": "gpt", "value": "(B) beach towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115262_114971662381500_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, door (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) door\n(B) chair" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446450_354697027458708_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to studio couch (highlighted by a red box)? Choose from drawer (highlighted by a blue box) and book (highlighted by a green box).\n(A) drawer\n(B) book" }, { "from": "gpt", "value": "(B) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43895960_133583862675040_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from bottle (highlighted by a red box)? Choose among these: bottle (highlighted by a blue box) or oven (highlighted by a green box).\n(A) bottle\n(B) oven" }, { "from": "gpt", "value": "(A) bottle" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204820_28671218282125_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, chair (highlighted by a red box) or candle (highlighted by a blue box)?\n(A) chair\n(B) candle" }, { "from": "gpt", "value": "(A) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358380_18908844197541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, curtain (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) curtain\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430280_186377166490791_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, cabinetry (highlighted by a red box) or appliance (highlighted by a blue box)?\n(A) cabinetry\n(B) appliance" }, { "from": "gpt", "value": "(B) appliance" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331946_165414531820083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, bottle (highlighted by a red box) or toothpaste (highlighted by a blue box)?\n(A) bottle\n(B) toothpaste" }, { "from": "gpt", "value": "(B) toothpaste" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204474_25087569060625_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the appliance (highlighted by a red box)? fireplace (highlighted by a blue box) or speaker (highlighted by a green box).\n(A) fireplace\n(B) speaker" }, { "from": "gpt", "value": "(B) speaker" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445613_56593809791041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, curtain (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) curtain\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333581_207654026173458_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from chair (highlighted by a red box), table (highlighted by a blue box) or shoulder bag (highlighted by a green box)?\n(A) table\n(B) shoulder bag" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649478_14865540175375_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhere is book (annotated by the red box) located in relation to table in the image?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(A) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334185_354534269521416_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from swivel chair (highlighted by a red box)? cabinetry (highlighted by a blue box) or cardboard box (highlighted by a green box)?\n(A) cabinetry\n(B) cardboard box" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333329_30178834439875_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, washing machine (highlighted by a red box) or tile (highlighted by a blue box)?\n(A) washing machine\n(B) tile" }, { "from": "gpt", "value": "(A) washing machine" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332952_21925404008375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from appliance (highlighted by a red box), lamp (highlighted by a blue box) or bottle (highlighted by a green box)?\n(A) lamp\n(B) bottle" }, { "from": "gpt", "value": "(A) lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662805_13511990236666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to window sill (highlighted by a red box)? bed (highlighted by a blue box) or window (highlighted by a green box).\n(A) bed\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739612_200181839722916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, toilet paper (highlighted by a red box) or toiletry (highlighted by a blue box)?\n(A) toilet paper\n(B) toiletry" }, { "from": "gpt", "value": "(A) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663415_95944870268958_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the magazine (highlighted by a red box)? mattress (highlighted by a blue box) or round table (highlighted by a green box).\n(A) mattress\n(B) round table" }, { "from": "gpt", "value": "(A) mattress" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115619_3175822202375_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nFrom the image's perspective, what is the correct spatial positioning of door (annotated by the red box) in reference to porcelain? Select from the following\n(A) above\n(B) below" }, { "from": "gpt", "value": "(B) below" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42446579_205813447040500_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, swivel chair (highlighted by a red box) or fireplace (highlighted by a blue box)?\n(A) swivel chair\n(B) fireplace" }, { "from": "gpt", "value": "(A) swivel chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739902_15056083660416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, counter (highlighted by a red box) or jug (highlighted by a blue box)?\n(A) counter\n(B) jug" }, { "from": "gpt", "value": "(B) jug" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358225_9617341066875_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is farthest from the camera?\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(B) B is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332398_401563402556125_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, television (highlighted by a red box) or dresser (highlighted by a blue box)?\n(A) television\n(B) dresser" }, { "from": "gpt", "value": "(B) dresser" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261329_24173040806875_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, bed (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) bed\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204493_26411331744791_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point is further to the camera?\nSelect from the following choices.\n(A) A is further\n(B) B is further" }, { "from": "gpt", "value": "(A) A is further" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333331_29901830536416_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, screen door (highlighted by a red box) or towel (highlighted by a blue box)?\n(A) screen door\n(B) towel" }, { "from": "gpt", "value": "(B) towel" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115240_98030880197708_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, curtain (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) curtain\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429798_737329930195250_image_with_points_1.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Which point appears closest to the camera in this image?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333475_58616240354083_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, cabinet (highlighted by a red box) or plywood (highlighted by a blue box)?\n(A) cabinet\n(B) plywood" }, { "from": "gpt", "value": "(A) cabinet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334760_421799542872416_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from pillow (highlighted by a red box)? Choose among these: material (highlighted by a blue box) or material (highlighted by a green box).\n(A) material\n(B) material" }, { "from": "gpt", "value": "(B) material" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332648_369085264840375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from houseplant (highlighted by a red box)? houseplant (highlighted by a blue box) or houseplant (highlighted by a green box)?\n(A) houseplant\n(B) houseplant" }, { "from": "gpt", "value": "(B) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333053_60102383325166_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, window (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) window\n(B) curtain" }, { "from": "gpt", "value": "(B) curtain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670208_54175666394291_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, studio couch (highlighted by a red box) or doormat (highlighted by a blue box)?\n(A) studio couch\n(B) doormat" }, { "from": "gpt", "value": "(B) doormat" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47430599_315416317450125_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from toy (highlighted by a red box)? furniture (highlighted by a blue box) or glass door (highlighted by a green box)?\n(A) furniture\n(B) glass door" }, { "from": "gpt", "value": "(B) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331491_153203624105666_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, mirror (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) mirror\n(B) cabinetry" }, { "from": "gpt", "value": "(A) mirror" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663317_76512775578541_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, cabinetry (highlighted by a red box) or tap (highlighted by a blue box)?\n(A) cabinetry\n(B) tap" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649397_9471263656166_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to screen door (highlighted by a red box)? door (highlighted by a blue box) or bulletin board (highlighted by a green box).\n(A) door\n(B) bulletin board" }, { "from": "gpt", "value": "(B) bulletin board" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331089_133747890043083_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, pillow (highlighted by a red box) or table (highlighted by a blue box)?\n(A) pillow\n(B) table" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899003_640694026673083_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to magazine (highlighted by a red box)? Choose from waste container (highlighted by a blue box) and footwear (highlighted by a green box).\n(A) waste container\n(B) footwear" }, { "from": "gpt", "value": "(A) waste container" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333310_28198638312708_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the entertainment center (highlighted by a red box)? houseplant (highlighted by a blue box) or plain (highlighted by a green box).\n(A) houseplant\n(B) plain" }, { "from": "gpt", "value": "(B) plain" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895864_489582277328541_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from furniture (highlighted by a red box)? radiator (highlighted by a blue box) or window sill (highlighted by a green box)?\n(A) radiator\n(B) window sill" }, { "from": "gpt", "value": "(B) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896545_30098501757333_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from bedside lamp (highlighted by a red box)? Choose from picture frame (highlighted by a blue box) and door (highlighted by a green box).\n(A) picture frame\n(B) door" }, { "from": "gpt", "value": "(B) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458306_101674886029166_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, television (highlighted by a red box) or guitar (highlighted by a blue box)?\n(A) television\n(B) guitar" }, { "from": "gpt", "value": "(A) television" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898917_816780145973500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, countertop (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) countertop\n(B) cabinetry" }, { "from": "gpt", "value": "(A) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204289_14396389612416_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from silverware (highlighted by a red box), cabinetry (highlighted by a blue box) or exhaust hood (highlighted by a green box)?\n(A) cabinetry\n(B) exhaust hood" }, { "from": "gpt", "value": "(A) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261452_35725952696583_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, window (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) window\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358118_62563383536375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is chair (annotated by the red box) located relative to chair?\n(A) right\n(B) left" }, { "from": "gpt", "value": "(B) left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649774_43610212926958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, window sill (highlighted by a red box) or pillow (highlighted by a blue box)?\n(A) window sill\n(B) pillow" }, { "from": "gpt", "value": "(B) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204686_13354374970666_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to stairwell (highlighted by a red box)? Select from towel (highlighted by a blue box) and screen door (highlighted by a green box).\n(A) towel\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332819_48884997071125_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, screen door (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) screen door\n(B) chair" }, { "from": "gpt", "value": "(A) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445584_283400773985791_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the toiletry (highlighted by a red box)? Choose among these: toiletry (highlighted by a blue box) or toiletry (highlighted by a green box).\n(A) toiletry\n(B) toiletry" }, { "from": "gpt", "value": "(B) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333298_26601941220500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, sink (highlighted by a red box) or drawer (highlighted by a blue box)?\n(A) sink\n(B) drawer" }, { "from": "gpt", "value": "(A) sink" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739633_1802576287791_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to dresser (highlighted by a red box)? pillow (highlighted by a blue box) or fan (highlighted by a green box).\n(A) pillow\n(B) fan" }, { "from": "gpt", "value": "(A) pillow" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444721_75341063825375_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, lighting (highlighted by a red box) or mirror (highlighted by a blue box)?\n(A) lighting\n(B) mirror" }, { "from": "gpt", "value": "(A) lighting" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43896075_132579612860208_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, table lamp (highlighted by a red box) or curtain (highlighted by a blue box)?\n(A) table lamp\n(B) curtain" }, { "from": "gpt", "value": "(A) table lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333892_78972163105750_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to paperback book (highlighted by a red box), paperback book (highlighted by a blue box) or paperback book (highlighted by a green box)?\n(A) paperback book\n(B) paperback book" }, { "from": "gpt", "value": "(A) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48018838_649201057287791_image_with_points_0.png", "conversations": [ { "from": "human", "value": "\nTwo points are circled on the image, labeled by A and B beside each circle. Among these points, which one is nearest to the camera?\n(A) A is closer\n(B) B is closer" }, { "from": "gpt", "value": "(B) B is closer" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899936_863430277177750_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from lamp (highlighted by a red box)? Choose from cabinetry (highlighted by a blue box) and cabinetry (highlighted by a green box).\n(A) cabinetry\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115217_94978734688708_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from kitchen & dining room table (highlighted by a red box)? pad (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) pad\n(B) chair" }, { "from": "gpt", "value": "(A) pad" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429717_18169245016375_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from cabinetry (highlighted by a red box)? Choose from bottle (highlighted by a blue box) and window (highlighted by a green box).\n(A) bottle\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45663053_38663397433125_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from chair (highlighted by a red box)? appliance (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) appliance\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204493_26447517392291_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, toiletries (highlighted by a red box) or toothbrush (highlighted by a blue box)?\n(A) toiletries\n(B) toothbrush" }, { "from": "gpt", "value": "(B) toothbrush" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445205_10759020492250_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, table (highlighted by a red box) or studio couch (highlighted by a blue box)?\n(A) table\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333493_62618602703375_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, houseplant (highlighted by a red box) or coffee cup (highlighted by a blue box)?\n(A) houseplant\n(B) coffee cup" }, { "from": "gpt", "value": "(B) coffee cup" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47204678_12478434415500_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to beige (highlighted by a red box)? throw pillow (highlighted by a blue box) or studio couch (highlighted by a green box).\n(A) throw pillow\n(B) studio couch" }, { "from": "gpt", "value": "(B) studio couch" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332609_363491413532500_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the shelf (highlighted by a red box)? Choose among these: book (highlighted by a blue box) or book (highlighted by a green box).\n(A) book\n(B) book" }, { "from": "gpt", "value": "(A) book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445955_130025547659250_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, furniture (highlighted by a red box) or paperback book (highlighted by a blue box)?\n(A) furniture\n(B) paperback book" }, { "from": "gpt", "value": "(B) paperback book" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/49739629_1965675405666_image_with_bbox_7.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to book (highlighted by a red box)? Select from bed (highlighted by a blue box) and plain (highlighted by a green box).\n(A) bed\n(B) plain" }, { "from": "gpt", "value": "(A) bed" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42444695_72665076092333_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from table (highlighted by a red box)? chair (highlighted by a blue box) or chair (highlighted by a green box)?\n(A) chair\n(B) chair" }, { "from": "gpt", "value": "(B) chair" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47429723_17905835422541_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, cabinetry (highlighted by a red box) or plant (highlighted by a blue box)?\n(A) cabinetry\n(B) plant" }, { "from": "gpt", "value": "(B) plant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47115165_88117483915375_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from toilet paper (highlighted by a red box), toilet (highlighted by a blue box) or bath (highlighted by a green box)?\n(A) toilet\n(B) bath" }, { "from": "gpt", "value": "(B) bath" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47895967_406866897063958_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image, window sill (highlighted by a red box) or mug (highlighted by a blue box)?\n(A) window sill\n(B) mug" }, { "from": "gpt", "value": "(A) window sill" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/48458218_76295432907416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is further to the camera, window (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) window\n(B) furniture" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47331430_546002009128166_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to houseplant (highlighted by a red box)? Select from radiator (highlighted by a blue box) and plant (highlighted by a green box).\n(A) radiator\n(B) plant" }, { "from": "gpt", "value": "(A) radiator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828368_92189517425583_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the curtain (highlighted by a red box)? curtain (highlighted by a blue box) or window (highlighted by a green box).\n(A) curtain\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334948_664607900777291_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo, furniture (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) furniture\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42445862_70616797004416_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, table (highlighted by a red box) or electric outlet (highlighted by a blue box)?\n(A) table\n(B) electric outlet" }, { "from": "gpt", "value": "(B) electric outlet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261600_53010903134916_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nIn this image, where is pillow (annotated by the red box) located relative to pillow?\n(A) left\n(B) right" }, { "from": "gpt", "value": "(B) right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45662912_19967747754041_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to mirror (highlighted by a red box)? Choose from book (highlighted by a blue box) and bedside lamp (highlighted by a green box).\n(A) book\n(B) bedside lamp" }, { "from": "gpt", "value": "(B) bedside lamp" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47669896_11108701264041_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to window screen (highlighted by a red box)? Choose from studio couch (highlighted by a blue box) and blanket (highlighted by a green box).\n(A) studio couch\n(B) blanket" }, { "from": "gpt", "value": "(B) blanket" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898215_145728674905916_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest to the camera in this image, door (highlighted by a red box) or table lamp (highlighted by a blue box)?\n(A) door\n(B) table lamp" }, { "from": "gpt", "value": "(A) door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899333_715122957229916_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, light (highlighted by a red box) or window blind (highlighted by a blue box)?\n(A) light\n(B) window blind" }, { "from": "gpt", "value": "(A) light" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47332204_264092569980708_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich is farther away from counter top (highlighted by a red box)? radiator (highlighted by a blue box) or refrigerator (highlighted by a green box)?\n(A) radiator\n(B) refrigerator" }, { "from": "gpt", "value": "(B) refrigerator" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898449_3237371083666_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich object is further to the camera taking this photo, toiletry (highlighted by a red box) or shower (highlighted by a blue box)?\n(A) toiletry\n(B) shower" }, { "from": "gpt", "value": "(A) toiletry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47333277_24447800168500_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to houseplant (highlighted by a red box)? houseplant (highlighted by a blue box) or houseplant (highlighted by a green box).\n(A) houseplant\n(B) houseplant" }, { "from": "gpt", "value": "(A) houseplant" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43828552_101538714971750_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from cabinetry (highlighted by a red box)? Select from fruit dish (highlighted by a blue box) and table (highlighted by a green box).\n(A) fruit dish\n(B) table" }, { "from": "gpt", "value": "(B) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47670063_37917512579125_image_with_bbox_6.png", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to window (highlighted by a red box)? window (highlighted by a blue box) or window (highlighted by a green box).\n(A) window\n(B) window" }, { "from": "gpt", "value": "(A) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649720_47900948147041_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, chair (highlighted by a red box) or screen door (highlighted by a blue box)?\n(A) chair\n(B) screen door" }, { "from": "gpt", "value": "(B) screen door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/43649633_39501243633541_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to window (highlighted by a red box), glass door (highlighted by a blue box) or cabinetry (highlighted by a green box)?\n(A) glass door\n(B) cabinetry" }, { "from": "gpt", "value": "(A) glass door" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261406_29856797409208_image_with_bbox_0.png", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest to the observer, door (highlighted by a red box) or cabinetry (highlighted by a blue box)?\n(A) door\n(B) cabinetry" }, { "from": "gpt", "value": "(B) cabinetry" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42899935_863116073979250_image_with_bbox_5.png", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from studio couch (highlighted by a red box)? Choose from light fixture (highlighted by a blue box) and window screen (highlighted by a green box).\n(A) light fixture\n(B) window screen" }, { "from": "gpt", "value": "(A) light fixture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44358406_40727373052500_image_with_bbox_4.png", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to blender (highlighted by a red box), beverage (highlighted by a blue box) or countertop (highlighted by a green box)?\n(A) beverage\n(B) countertop" }, { "from": "gpt", "value": "(B) countertop" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/44796721_27329889585500_image_with_bbox_3.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, bottle (highlighted by a red box) or window (highlighted by a blue box)?\n(A) bottle\n(B) window" }, { "from": "gpt", "value": "(B) window" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/45261096_1336451923291_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest to the camera, table (highlighted by a red box) or chair (highlighted by a blue box)?\n(A) table\n(B) chair" }, { "from": "gpt", "value": "(A) table" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/47334205_103852180091583_image_with_bbox_2.png", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera, furniture (highlighted by a red box) or furniture (highlighted by a blue box)?\n(A) furniture\n(B) furniture" }, { "from": "gpt", "value": "(B) furniture" } ] }, { "image": "/data/shared/Qwen/RefSpatial/3D/image_visual_choice/42898625_757764502494458_image_with_bbox_1.png", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera, water cooler (highlighted by a red box) or toilet paper (highlighted by a blue box)?\n(A) water cooler\n(B) toilet paper" }, { "from": "gpt", "value": "(B) toilet paper" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f4e0bbf8aac640d.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.492, 0.086) come farther from viewer compared to point (0.865, 0.927)?" }, { "from": "gpt", "value": "Yes, it is behind point (0.865, 0.927)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06040fd0428195df.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the fuzzy brown rabbit at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.487, 0.486)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5798edf95ab7e654.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass at lower center thinner than camouflage jacket at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/25e4e8652483c6f3.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between point (0.575, 0.708) and camera." }, { "from": "gpt", "value": "Point (0.575, 0.708) and camera are 3.64 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca7576067fbc7778.jpg", "conversations": [ { "from": "human", "value": "\nBetween dark blue metallic van at right and metallic red car at center right, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "Positioned to the right is metallic red car at center right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/108c34eef7ba63d4.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.007, 0.787) lie in front of point (0.169, 0.797)?" }, { "from": "gpt", "value": "No, (0.007, 0.787) is behind (0.169, 0.797)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/59f78193942cc885.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown wooden house at center appear under white powdery snow at lower left?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b325c5621e06175.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the black satin suit at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.554, 0.592)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fdb8df51813e73d6.jpg", "conversations": [ { "from": "human", "value": "\nBetween blue cotton shirt at center and shiny black fish at upper center, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "shiny black fish at upper center is more to the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c92cb91dbc3d3b38.jpg", "conversations": [ { "from": "human", "value": "\nIs white fluffy rice at right further to camera compared to shiny red tomatoes at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/668848ee3e12504a.jpg", "conversations": [ { "from": "human", "value": "\nDoes beige sand at center have a greater width compared to wooden gazebo at upper left?" }, { "from": "gpt", "value": "Incorrect, beige sand at center's width does not surpass wooden gazebo at upper left's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d2973f66d26311e6.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, gold metallic truck at center or white matte truck at center?" }, { "from": "gpt", "value": "From the viewer's perspective, white matte truck at center appears more on the left side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba4f296819950656.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.304, 0.936) and point (0.107, 0.523), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.304, 0.936) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/277caea2039e2393.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.442, 0.781) and point (0.196, 0.650), which one is positioned in front?" }, { "from": "gpt", "value": "Positioned in front is point (0.196, 0.650)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/571b9f183bc0c88e.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.071, 0.425) less distant than point (0.918, 0.966)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ffd4475b21bd7a18.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the winter scene described. You want to place a small snowman exactly at the point marked by point (0.474, 0.797). Is there enough snow at white powdery snow at lower center to build a snowman there?" }, { "from": "gpt", "value": "The point (0.474, 0.797) marks white powdery snow at lower center, which is described as having a thin layer of snow with patches of grass peeking through. Since the snow is thin and has grass visible, there may not be enough snow to build a snowman at that location." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc1f0ad09037d716.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the sidewalk and see two points marked on the road. The first point is at coordinates point (0.379, 0.470) and the second point is at point (0.379, 0.541). Which point is closer to your current position on the sidewalk?" }, { "from": "gpt", "value": "Point (0.379, 0.470) is further to the camera than point (0.379, 0.541). Therefore, the point closer to your position on the sidewalk is point (0.379, 0.541)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86335f9b72fdf9c1.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer who just arrived at the scene and want to take a photo of the two people in the center. The camera you have is the silver metallic camera at center. To frame the shot properly, you need to position the green matte shirt at center to the right of the camera. Is the current arrangement already set up this way?" }, { "from": "gpt", "value": "Yes, the green matte shirt at center is already positioned to the right of the silver metallic camera at center, so the current arrangement is suitable for your desired framing." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e4f88874388a9301.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any smooth leather coat at center in the image." }, { "from": "gpt", "value": "[(0.292, 0.380)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/027d9789dcf9b67e.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the classroom and want to reach the point marked at coordinates point (0.198, 0.456). If your walking path is clear, how far do you have to walk to get there?" }, { "from": "gpt", "value": "The point (0.198, 0.456) is 3.30 meters away from you, so you have to walk 3.30 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e0b918f50965fe5.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the white matte blazer at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.804, 0.611)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a1d3598de487e8f.jpg", "conversations": [ { "from": "human", "value": "\nBetween red fabric chair at center and light beige jacket at right, which one is positioned higher?" }, { "from": "gpt", "value": "Positioned higher is light beige jacket at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/93d360bc03f4bd37.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of white stone church at center?" }, { "from": "gpt", "value": "12.87 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/56502f14895ab3e1.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.481, 0.170)?" }, { "from": "gpt", "value": "matte orange cloud at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/20b3745dc88e9c76.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing 1.5 meters away from the orange matte shirt at center. Can you take a clear photo of it without moving closer?" }, { "from": "gpt", "value": "The orange matte shirt at center is 1.73 meters away from the camera. Since you are standing 1.5 meters away, you are closer than the shirt, so you can take a clear photo without needing to move closer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23a6128771fb69d6.jpg", "conversations": [ { "from": "human", "value": "\nYou are a drone operator trying to navigate between two points in the industrial area. The first point is at coordinates point (0.189, 0.184), and the second point is at coordinates point (0.296, 0.341). Which point is closer to the dense greenery in the foreground?" }, { "from": "gpt", "value": "Point (0.296, 0.341) is closer to the dense greenery in the foreground because it is in front of point (0.189, 0.184), which is further back." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be6e8b74344de188.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if yellowplastic/texturedlicense plate at center is positioned to the left of matte white headlight at lower center?" }, { "from": "gpt", "value": "Correct, you'll find yellowplastic/texturedlicense plate at center to the left of matte white headlight at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b70e96c4b2bea382.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.378, 0.444) more distant than point (0.099, 0.637)?" }, { "from": "gpt", "value": "No, it is in front of (0.099, 0.637)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/393b9629d0aaca5a.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.070, 0.194) closer to viewer compared to point (0.467, 0.652)?" }, { "from": "gpt", "value": "Yes, point (0.070, 0.194) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a81e14fdca5d92df.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to dark blue hoodie at left? Please provide its 2D coordinates.Where can I find dark blue hoodie at left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.293, 0.091)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c035655157424666.jpg", "conversations": [ { "from": "human", "value": "\nYou are an event organizer setting up for a presentation. You have a matte white projection screen at center and a purple matte shirt at center. Which object is wider?" }, { "from": "gpt", "value": "The matte white projection screen at center is wider than the purple matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/65adfa0a4ac1efca.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a clear water at center. Pinpoint a point to the clear water at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.472, 0.816)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a08ec00107b7f702.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at point (0.996, 0.592) and want to walk to point (0.269, 0.828). Based on the image, which direction should you move?" }, { "from": "gpt", "value": "You should move forward because point (0.269, 0.828) is behind point (0.996, 0.592), so moving in the direction away from the starting point will reach the destination." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7039676af32cf8b7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte gray crt monitor at center is bigger than matte black aquarium at left?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c84687077e5b6828.jpg", "conversations": [ { "from": "human", "value": "\nDoes black polished stone plaque at right have a lesser height compared to metallic pole at center?" }, { "from": "gpt", "value": "Yes, black polished stone plaque at right is shorter than metallic pole at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b131ced9084f8bc0.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the waterfront scene. You notice the blue glossy water at center and the blue matte container ship at center in your viewfinder. Which object appears larger in height when viewed from your current position?" }, { "from": "gpt", "value": "The blue glossy water at center appears much taller than the blue matte container ship at center in the scene." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29fc437924357e4c.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, brown paper bag at center or clear glass bottles at lower left?" }, { "from": "gpt", "value": "Positioned to the right is brown paper bag at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78452bbb4a4d9a24.jpg", "conversations": [ { "from": "human", "value": "\nPoint to white matte jacket at center.Point to the white matte jacket at center in the image." }, { "from": "gpt", "value": "[(0.540, 0.680)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7843ceebd53a8ffa.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is matte black polo shirt at upper center from dark matte plastic cup at upper center?" }, { "from": "gpt", "value": "A distance of 2.33 meters exists between matte black polo shirt at upper center and dark matte plastic cup at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e1779d7abd7dd4c.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.263, 0.431) from camera?" }, { "from": "gpt", "value": "A distance of 26.81 meters exists between point (0.263, 0.431) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2942d54c84e40d82.jpg", "conversations": [ { "from": "human", "value": "\nIs blue fabric football team at center taller than blue wool sweater at left?" }, { "from": "gpt", "value": "In fact, blue fabric football team at center may be shorter than blue wool sweater at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8647b94876bd336e.jpg", "conversations": [ { "from": "human", "value": "\nDescribe the object at (0.727, 0.416)." }, { "from": "gpt", "value": "blue fabric shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/21612e5b68a3e2c5.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, green leafy trees at center or brown feathered bird at left?" }, { "from": "gpt", "value": "brown feathered bird at left is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4ae01d03622ebc7.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.655, 0.487) and point (0.986, 0.370), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.655, 0.487) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49f5209764ce2516.jpg", "conversations": [ { "from": "human", "value": "\nIs orange mesh tank top at center further to camera compared to purple fabric shorts at right?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ddbeb74f5beeea10.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark blue fabric shirt at lower right come behind wooden at right?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95d17aade1e61ee2.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of wooden frame at left?" }, { "from": "gpt", "value": "A distance of 4.63 meters exists between wooden frame at left and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be90fcdb98108595.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray asphalt pavement at center is positioned above metallic silver sign at upper right?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf6b409b67c719fc.jpg", "conversations": [ { "from": "human", "value": "\nIs multicolored fabric bikini top at upper right shorter than red silk dress at back?" }, { "from": "gpt", "value": "No, multicolored fabric bikini top at upper right is not shorter than red silk dress at back." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7369243843d5d9b5.jpg", "conversations": [ { "from": "human", "value": "\nDoes green grass at center appear over black matte soccer player at center?" }, { "from": "gpt", "value": "Actually, green grass at center is below black matte soccer player at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2326b554cdf4c58e.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of brown rough bark tree at left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.062, 0.130)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/499b5d3105cec2e0.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the smooth black fence at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.538, 0.842)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/081cfb157127d22f.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the bearded man at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.960, 0.791)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8296806b2232838e.jpg", "conversations": [ { "from": "human", "value": "\nBetween green textured palm tree at right and green leafy palm tree at right, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "Positioned to the right is green textured palm tree at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/57ffaf1c9364bee4.jpg", "conversations": [ { "from": "human", "value": "\nIs metallic silver can at center below black plastic keyboard at center?" }, { "from": "gpt", "value": "Correct, metallic silver can at center is located below black plastic keyboard at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/978cf4dd03892ee2.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.044, 0.698) and camera." }, { "from": "gpt", "value": "The distance of point (0.044, 0.698) from camera is 8.61 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f6e874e369dd00e5.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of dusty brown dirt field at center in the image." }, { "from": "gpt", "value": "[(0.493, 0.814)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e00e62a6ba23b8d7.jpg", "conversations": [ { "from": "human", "value": "\nYou are driving a car and need to check the position of the black glossy dashboard at center relative to the point marked at coordinates (0.526, 0.878). Is the dashboard exactly at that point?" }, { "from": "gpt", "value": "Yes, the black glossy dashboard at center is located exactly at point (0.526, 0.878)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/80c9ce499126890e.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the striped cotton shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.591, 0.787)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02f0f2a3f2b25572.jpg", "conversations": [ { "from": "human", "value": "\nLocate the black plastic letter v at center in the image." }, { "from": "gpt", "value": "[(0.252, 0.694)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a9d3f666baeed467.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the two panels in the park. You want to take a closer look at the blue glossy map at center on the left panel. Considering you can only move forward 3 meters, will you be able to reach it?" }, { "from": "gpt", "value": "The blue glossy map at center is 5.00 meters away from the camera. Since you can only move forward 3 meters, you will not be able to reach it as the distance is greater than your movement capability." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/84ce64c582c365cc.jpg", "conversations": [ { "from": "human", "value": "\nDoes glossy blue sedan at right appear on the right side of white plastic license plate at center?" }, { "from": "gpt", "value": "Indeed, glossy blue sedan at right is positioned on the right side of white plastic license plate at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c41e95da74ad5069.jpg", "conversations": [ { "from": "human", "value": "\nDoes black leather jacket at left have a lesser width compared to matte red cardigan at center?" }, { "from": "gpt", "value": "Yes, black leather jacket at left is thinner than matte red cardigan at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ad42bbb75e007f57.jpg", "conversations": [ { "from": "human", "value": "\nHow distant is snow-covered evergreen tree at center from wooden cabin at center?" }, { "from": "gpt", "value": "snow-covered evergreen tree at center and wooden cabin at center are 16.68 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/763295eb98f188d8.jpg", "conversations": [ { "from": "human", "value": "\nIs blue paper at center below fuzzy brown bear at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f0d587d812bdefd0.jpg", "conversations": [ { "from": "human", "value": "\nIs dry grass at center positioned in front of green leafy tree at upper right?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d3ce29a316bc5ab0.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.545, 0.548) positioned after point (0.755, 0.597)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba97d84803d8453e.jpg", "conversations": [ { "from": "human", "value": "\nIs gray asphalt at center smaller than black rubber pole at right?" }, { "from": "gpt", "value": "No, gray asphalt at center is not smaller than black rubber pole at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07e234b925cc908c.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person trying to navigate through the busy street. You see two traffic lights ahead. The first is the black matte traffic light at upper center and the second is the black plastic traffic light at center. Which traffic light is on the left side when looking towards them?" }, { "from": "gpt", "value": "The black matte traffic light at upper center is positioned on the left side of the black plastic traffic light at center, so when looking towards them, the black matte traffic light at upper center is on the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1fdcfa2b9a619383.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the beige glass building at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.411, 0.455)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5927a2831961b98.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the stone wall with the arched doorway. There is a point marked at coordinates point (0.594, 0.669). If you want to reach that point, how far do you need to walk?" }, { "from": "gpt", "value": "The point (0.594, 0.669) is 8.38 meters away from you, so you need to walk 8.38 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/09fe1ca707461a87.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of two chairs against a wall. You notice two specific points marked on the chairs. The first point is at coordinate point (0.467, 0.652) and the second is at point (0.309, 0.506). From your perspective, which point is closer to you?" }, { "from": "gpt", "value": "Point (0.309, 0.506) is closer to you because it is in front of point (0.467, 0.652), which is behind it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b6c6ecfe98990ca7.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, brown matte hair at center or matte skin at center?" }, { "from": "gpt", "value": "From the viewer's perspective, brown matte hair at center appears more on the left side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/48f7637018336ae2.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.548, 0.823) come farther from viewer compared to point (0.467, 0.372)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a21fbb7a30fd771b.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, gray matte bird at left or white matte bird at center?" }, { "from": "gpt", "value": "white matte bird at center is below." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e8631bb72186320.jpg", "conversations": [ { "from": "human", "value": "\nWhere is pink velvet gown at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.732, 0.733)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/909f619dcb1f47c0.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, white matte shirt at left or white cloth at upper left, stands shorter?" }, { "from": "gpt", "value": "white cloth at upper left is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ed2f1050c76ab81.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.218, 0.986) positioned after point (0.069, 0.567)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b68f33c19b9e210.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a green grass at center. Pinpoint a point to the green grass at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.540, 0.902)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6400de2365bfbc54.jpg", "conversations": [ { "from": "human", "value": "\nYou are sitting in the front row of the lecture hall and notice the brown wood podium at lower left. How far is the podium from your current position?" }, { "from": "gpt", "value": "The brown wood podium at lower left is 9.86 feet from the viewer, so it is approximately 9.86 feet away from your current position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b23157738e1d1b2b.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the gray brick pavement at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.519, 0.738)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/464b99a2a070627a.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the green smooth asparagus at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.484, 0.470)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82c15422acc74846.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.181, 0.308) or point (0.294, 0.134)?" }, { "from": "gpt", "value": "Point (0.181, 0.308)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e7d0357f317eacd.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between light brown wool coat at center and camera." }, { "from": "gpt", "value": "light brown wool coat at center and camera are 11.16 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2771040ea7921072.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the United States Capitol building and notice two green leafy trees in the image. Which tree, the green leafy tree at upper center or the green leafy tree at upper left, is positioned more to the right side of the scene?" }, { "from": "gpt", "value": "The green leafy tree at upper center is positioned more to the right side of the scene compared to the green leafy tree at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0972ffe45c6f639d.jpg", "conversations": [ { "from": "human", "value": "\nHow far is clear glass mirror at center from camera?" }, { "from": "gpt", "value": "clear glass mirror at center and camera are 18.01 inches apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/880f6cdadfc875e6.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.494, 0.727) and point (0.686, 0.319), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.686, 0.319) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6951ea8ec5b5cb41.jpg", "conversations": [ { "from": "human", "value": "\nBetween black glossy monitor at center and black plastic keyboard at center, which one is positioned lower?" }, { "from": "gpt", "value": "black plastic keyboard at center is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/87af39356818eb5e.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of white fabric tank top at left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.077, 0.708)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6153ed1e08d26c79.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of black matte coat at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.462, 0.778)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8dc4fa006df69e23.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if orange matte lifeboat at upper left is smaller than brown wooden deck at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/472205fb4f45dc82.jpg", "conversations": [ { "from": "human", "value": "\nIs green algae-covered water at center below green grassy at center?" }, { "from": "gpt", "value": "Correct, green algae-covered water at center is located below green grassy at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/764d1ef80b108e70.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is dark brown hair at right from camera?" }, { "from": "gpt", "value": "A distance of 20.28 inches exists between dark brown hair at right and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37d0887453173169.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, white matte shirt at center or pink fabric shorts at center?" }, { "from": "gpt", "value": "Positioned to the left is white matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb9b134150a4fa15.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.729, 0.573) positioned before point (0.342, 0.569)?" }, { "from": "gpt", "value": "No, it is behind (0.342, 0.569)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fd85e413301bf9e8.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the gray stone carving at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.484, 0.597)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/94f4c3f7939c03f6.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing items on a desk and need to place a new object between the black matte speaker at lower center and the brown scaly lizard at lower left. Is there enough space between them to fit a small notebook?" }, { "from": "gpt", "value": "The black matte speaker at lower center is to the right of the brown scaly lizard at lower left, so there is space between them. A small notebook can be placed between the black matte speaker at lower center and the brown scaly lizard at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c1617364fb1d0626.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of black fabric jacket at center?" }, { "from": "gpt", "value": "4.05 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/059a79cf961f44e9.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing a small event in this room and need to place a large banner that requires a surface bigger than the black suit at right. Can the brown wooden table at center accommodate it?" }, { "from": "gpt", "value": "The brown wooden table at center is larger in size than the black suit at right, so yes, the banner can be placed on the brown wooden table at center since it has sufficient space." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/14ad67a44ff29cfd.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.492, 0.472) or point (0.308, 0.589)?" }, { "from": "gpt", "value": "Point (0.308, 0.589)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e90de29a9b7d030.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the child in the image. The client wants to ensure the hand and eye are visible. Based on the scene, can you confirm if the smooth skin hand at left is not covering the pink glossy eye at center?" }, { "from": "gpt", "value": "The smooth skin hand at left is positioned on the left side of the pink glossy eye at center, so it is not covering the eye and both are visible." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/535f27c33a2c5e4c.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.742, 0.739) and camera." }, { "from": "gpt", "value": "Point (0.742, 0.739) is 1.99 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e3f586f31d9fc58.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.882, 0.452) from camera?" }, { "from": "gpt", "value": "A distance of 29.73 inches exists between point (0.882, 0.452) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86314b5065827cbf.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.301, 0.650)?" }, { "from": "gpt", "value": "smooth concrete water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/121430be5d32d416.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black suit at center appear over transparent plastic microphone at center?" }, { "from": "gpt", "value": "Indeed, matte black suit at center is positioned over transparent plastic microphone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/208ef57dec93c43c.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black hoodie at center appear on the right side of blue plastic megaphone at center?" }, { "from": "gpt", "value": "In fact, matte black hoodie at center is to the left of blue plastic megaphone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d9017ba35dc2df6.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between white fabric canopy at upper center and camera?" }, { "from": "gpt", "value": "34.58 feet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/772ffa6cbb222ee7.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.766, 0.505) positioned in front of point (0.523, 0.523)?" }, { "from": "gpt", "value": "Yes, point (0.766, 0.505) is in front of point (0.523, 0.523)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1eca2b115f2410b.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the green tie-dye shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.558, 0.487)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff52958529941d90.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.558, 0.431)?" }, { "from": "gpt", "value": "wooden at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4f3bf1ebfdb300e.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between green leafy trees at left and green leafy trees at right." }, { "from": "gpt", "value": "A distance of 151.28 feet exists between green leafy trees at left and green leafy trees at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cbca4240f1b2b1b6.jpg", "conversations": [ { "from": "human", "value": "\nHow much distance is there between shiny red apple at upper right and smooth yellow orange at center?" }, { "from": "gpt", "value": "3.35 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08ac6f72926aada3.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the community hall watching the lion dance performance. You notice the black fabric pants at left in the crowd. If you want to approach them, how far would you have to walk?" }, { "from": "gpt", "value": "The black fabric pants at left are 6.96 meters away from the viewer, so you would need to walk approximately 6.96 meters to reach them." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3160d874a2323bae.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.849, 0.233) and point (0.619, 0.858), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.849, 0.233) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03c9ce14db9c4441.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, green leafy palm tree at right or green leafy palm tree at center?" }, { "from": "gpt", "value": "green leafy palm tree at center is more to the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1489fb7bca5ec75f.jpg", "conversations": [ { "from": "human", "value": "\nWhere is blue glossy cupcake at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.482, 0.419)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/48d4bf8580c4aaa0.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.402, 0.697) and point (0.160, 0.395), which one is positioned behind?" }, { "from": "gpt", "value": "Positioned behind is point (0.160, 0.395)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/41365c78eb09090f.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of white wax candle at lower left. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.049, 0.823)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2118f5f54f4adb26.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance measurement between pink matte shirt at center and matte gray t-shirt at center?" }, { "from": "gpt", "value": "pink matte shirt at center is 23.07 feet from matte gray t-shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0e504bc450c5167.jpg", "conversations": [ { "from": "human", "value": "\nWhere is dark blue jacket at lower left located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.021, 0.966)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db413763902bf1ba.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and want to take a photo of the scene. There is a point at coordinates point (0.829, 0.498). How far is that point from you?" }, { "from": "gpt", "value": "The point at coordinates point (0.829, 0.498) is 19.22 inches away from the camera position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c0ef3281fb5492f.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker planning to cross from the matte gray rock at center to the green smooth rock at lower center. Which rock will you step onto first?" }, { "from": "gpt", "value": "You will step onto the matte gray rock at center first because it is closer to you than the green smooth rock at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7d0af88cb8a10e8d.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between point (0.511, 0.664) and camera." }, { "from": "gpt", "value": "The distance of point (0.511, 0.664) from camera is 74.01 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b2cf8549a7e4f9f7.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of white fluffy cloud at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.523, 0.333)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36bbced3ec74990c.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the left, matte green tree at center or green matte skateboard at upper left?" }, { "from": "gpt", "value": "Positioned to the left is green matte skateboard at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a39c6591c89c0002.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of black metal railing at lower center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.469, 0.950)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7d2acba1f4ec0c6.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte boat at lower center bigger than white matte boat at center?" }, { "from": "gpt", "value": "Correct, white matte boat at lower center is larger in size than white matte boat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8f8cf715fc534de0.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the dog show and want to capture a closeup of the black matte skirt at center. Where exactly should you focus your camera?" }, { "from": "gpt", "value": "You should focus your camera at point 0.267 on the x axis and 0.622 on the y axis to capture the black matte skirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/522829aefefe8075.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of the historic stone gatehouse and notice a point marked at coordinates (0.438, 0.930). Based on the scene description, can you determine what surface this point is located on?" }, { "from": "gpt", "value": "The point is located on the brown stone alley at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c6860cdd5f0ea11b.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a shiny black horse at center. Pinpoint a point to the shiny black horse at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.486, 0.502)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4e3c57ef36a89196.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the pedestrian bridge and see the denim shorts at lower left. Where exactly are they located on the bridge?" }, { "from": "gpt", "value": "The denim shorts at lower left are located at point (0.146, 0.889) on the bridge." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1851e869da7f9395.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing in front of the green checkered shirt at center. You want to take a closeup shot of the shirt. The camera you are using has a minimum focusing distance of 1 meter. Can you focus on the shirt without moving closer?" }, { "from": "gpt", "value": "The green checkered shirt at center and viewer are 76.00 centimeters apart. Since the minimum focusing distance is 1 meter, the camera cannot focus on the shirt from this distance. You need to move back or adjust the camera settings." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06b696eecd5919a2.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.561, 0.569)?" }, { "from": "gpt", "value": "floral chiffon dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f8345b83146d2835.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of green polished stone monument at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.567, 0.452)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7d95bca484f4d29.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of black sequined scarf at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.344, 0.662)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cb706404cf8143d9.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.691, 0.547) positioned behind point (0.585, 0.603)?" }, { "from": "gpt", "value": "No, (0.691, 0.547) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd7319066d1d281a.jpg", "conversations": [ { "from": "human", "value": "\nLocate polished metallic spheres at center in the image." }, { "from": "gpt", "value": "[(0.498, 0.472)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e75b60dcfa7bc58f.jpg", "conversations": [ { "from": "human", "value": "\nHow close is point (0.502, 0.508) from camera?" }, { "from": "gpt", "value": "Point (0.502, 0.508) and camera are 3.57 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/39b4713a27bffdd8.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of matte paper cup at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.362, 0.586)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4829383fc7d5abaa.jpg", "conversations": [ { "from": "human", "value": "\nDoes shiny metallic helmet at center have a lesser height compared to matte white dress at upper left?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8778d11a53d56a34.jpg", "conversations": [ { "from": "human", "value": "\nYou are designing a new bathroom layout and need to place the white plastic scale at center so that it accommodates both the light skin textured foot at center and another similar foot. Given that the scale is bigger than the foot, will the scale provide enough space for both feet?" }, { "from": "gpt", "value": "The white plastic scale at center is bigger than the light skin textured foot at center, so yes, the scale should provide enough space to accommodate both feet since it is larger than a single foot." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5626c36cdb446458.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing an event and need to choose between the matte black helmet at center and the black glossy helmet at center for a demonstration. Which helmet has a larger size?" }, { "from": "gpt", "value": "The matte black helmet at center is bigger than the black glossy helmet at center, so the matte black helmet at center has a larger size." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de69c4d97458920e.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the museum and want to touch the dark gray sweater at left. How far do you need to walk to reach it?" }, { "from": "gpt", "value": "The dark gray sweater at left is 3.70 meters from the viewer, so you need to walk 3.70 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/091d664d96230041.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.471, 0.245) and point (0.411, 0.231), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.471, 0.245) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b035f2cfc12de72.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black shorts at left in front of matte blue shorts at center?" }, { "from": "gpt", "value": "Yes, matte black shorts at left is in front of matte blue shorts at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a02e59e62c697cdc.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of green cotton cloth at upper center in the image." }, { "from": "gpt", "value": "[(0.728, 0.528)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e7281ea289bc68b1.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of golden glass beer at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.681, 0.736)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3e74c37f76bb1bc5.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.693, 0.181) and point (0.648, 0.248), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.693, 0.181) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b609ced84729373e.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.048, 0.542) positioned before point (0.407, 0.667)?" }, { "from": "gpt", "value": "Yes, point (0.048, 0.542) is in front of point (0.407, 0.667)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0849be732790feb6.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.662, 0.497) or (0.742, 0.484)?" }, { "from": "gpt", "value": "Positioned behind is point (0.662, 0.497)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e8d624aa651a8af.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the metallic silver shelter at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.920, 0.475)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0eda26a12087b6f2.jpg", "conversations": [ { "from": "human", "value": "\nYou are a safety inspector checking the shooting range. You notice the camouflage uniform at left and the camouflage textured rifle at center. Which object is taller?" }, { "from": "gpt", "value": "The camouflage uniform at left is taller than the camouflage textured rifle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2162c2beba6f835e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if metallic cockpit at center is positioned to the left of camouflage uniform at right?" }, { "from": "gpt", "value": "Correct, you'll find metallic cockpit at center to the left of camouflage uniform at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3998d5525a846ee2.jpg", "conversations": [ { "from": "human", "value": "\nBetween plaid fabric backpack at center and matte green jacket at center, which one has less height?" }, { "from": "gpt", "value": "With less height is matte green jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0932c6f7135959f9.jpg", "conversations": [ { "from": "human", "value": "\nYou are at an outdoor event and see the matte red jacket at left and the red fabric umbrella at upper center. Which object is smaller in size?" }, { "from": "gpt", "value": "The matte red jacket at left is smaller in size compared to the red fabric umbrella at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/94588981c2124d3f.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.256, 0.855) and point (0.835, 0.195), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.256, 0.855) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/14ba894b82fe75e4.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy palm tree at left shorter than green leafy palm tree at right?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b874d9ef584f901.jpg", "conversations": [ { "from": "human", "value": "\nA drone is flying at a height of 10 meters above the ground. It needs to capture a photo of the point at (0.247, 0.916) while avoiding the traffic signal pole. Given that the traffic signal pole is 12 meters tall, will the drone be able to fly under the pole and still get a clear shot of the point?" }, { "from": "gpt", "value": "The traffic signal pole is 12 meters tall, and the drone is flying at 10 meters. Since the drone is below the pole, it can fly under the pole and still capture the point at (0.247, 0.916) as long as there are no other obstructions between them." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5867355a012f529d.jpg", "conversations": [ { "from": "human", "value": "\nBetween concrete at center and matte black jacket at center, which one is positioned lower?" }, { "from": "gpt", "value": "concrete at center is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01d6551716dd7848.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the front of the parade float and see the point marked at coordinates (0.937, 0.830). What object is located at that point?" }, { "from": "gpt", "value": "The point at coordinates (0.937, 0.830) marks the white cotton shirt at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c41e02f26cc80b2.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the bar cart and want to place a 10 cm tall watermelon matte at lower center on the top shelf. Can you determine if there is enough vertical space between the top shelf and the decorative pink oval mirror to accommodate it?" }, { "from": "gpt", "value": "The watermelon matte at lower center is 8.57 feet away from the viewer, but the vertical space between the top shelf and the decorative pink oval mirror isn" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c48142c05c42316e.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.638, 0.277) closer to camera compared to point (0.708, 0.211)?" }, { "from": "gpt", "value": "No, it is behind (0.708, 0.211)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0fbbdc13b109f257.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.154, 0.145) closer to camera compared to point (0.822, 0.325)?" }, { "from": "gpt", "value": "Yes, point (0.154, 0.145) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c92f0653964957d7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue denim jeans at upper center is smaller than matte pink pants at left?" }, { "from": "gpt", "value": "Indeed, blue denim jeans at upper center has a smaller size compared to matte pink pants at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d39d0e1e0b925aba.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte boat at center to the left of blue plastic canoe at lower left from the viewer's perspective?" }, { "from": "gpt", "value": "Incorrect, white matte boat at center is not on the left side of blue plastic canoe at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5fcce71fb66e7068.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.907, 0.716) farther from camera compared to point (0.324, 0.741)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ec0a4e2c8cd4e18.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of purple knitted neckband at center in the image." }, { "from": "gpt", "value": "[(0.700, 0.658)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/218fc49bcdcaf1a1.jpg", "conversations": [ { "from": "human", "value": "\nWhere is plaid fabric umbrella at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.822, 0.592)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a33b0181802fffa.jpg", "conversations": [ { "from": "human", "value": "\nYou are a soccer player trying to locate the ball during a break in play. The ball is at the point marked as point (0.571, 0.302). Which object in the scene is the ball closest to?" }, { "from": "gpt", "value": "The ball at point (0.571, 0.302) is on the maroon jersey at upper center, so it is closest to that object." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0839888ef657930f.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any brown wood at center in the image." }, { "from": "gpt", "value": "[(0.595, 0.958)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0266f3c7c5c76e15.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the concert and want to take a photo of the blue cotton shirt at center and the black matte headphones at left. Which object should you focus on first if you want to capture both in the same frame without moving the camera?" }, { "from": "gpt", "value": "The black matte headphones at left should be focused on first because they are positioned to the left of the blue cotton shirt at center, so adjusting focus from left to right would naturally include both in the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c1c6c353296ca2af.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.119, 0.308) come closer to viewer compared to point (0.760, 0.633)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.760, 0.633)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0762f5c378cc4758.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the green grass at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.480, 0.825)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07f7e7626c0cb499.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue water at lower left is positioned to the right of red jacket at left?" }, { "from": "gpt", "value": "In fact, blue water at lower left is to the left of red jacket at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04043d9d47853d76.jpg", "conversations": [ { "from": "human", "value": "\nHow much distance is there between smooth concrete pavement at center and pink rubber bicycle at left?" }, { "from": "gpt", "value": "smooth concrete pavement at center and pink rubber bicycle at left are 2.38 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/18eb4e9487b7d89b.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.787, 0.444) come farther from viewer compared to point (0.860, 0.412)?" }, { "from": "gpt", "value": "No, (0.787, 0.444) is in front of (0.860, 0.412)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/53f4e8a37361048a.jpg", "conversations": [ { "from": "human", "value": "\nLocate the pink chalk writing at center in the image." }, { "from": "gpt", "value": "[(0.439, 0.375)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8cb76fdbd3d3ec78.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point labeled point (0.905, 0.947). There is another person 5.15 meters away from you. Can you see them clearly?" }, { "from": "gpt", "value": "Yes, because the other person is 5.15 meters away from you, which is within a typical visibility range, so you can see them clearly." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c1de39e031e3a16.jpg", "conversations": [ { "from": "human", "value": "\nHow close is brown woolen suit at right from dark gray suit at center?" }, { "from": "gpt", "value": "20.91 inches" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb79b85420b17190.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black suit at center lie behind blue cotton shirt at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/96c0f72d0374f276.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the blue fabric backpack at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.331, 0.794)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de212e062a587d49.jpg", "conversations": [ { "from": "human", "value": "\nBetween matte black shirt at center and brown matte shirt at lower right, which one has more height?" }, { "from": "gpt", "value": "With more height is matte black shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b544b3a9833f2b1.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.527, 0.511) in front of point (0.448, 0.717)?" }, { "from": "gpt", "value": "No, (0.527, 0.511) is behind (0.448, 0.717)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab9728b4af6fce17.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown textured tree at center have a greater height compared to matte pink tree at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4cbe6e983128c20d.jpg", "conversations": [ { "from": "human", "value": "\nYou are an airplane pilot flying over the mountainous landscape. You notice the white fluffy cloud at upper left and the snowy granite mountain range at center. Which one appears higher in the sky from your perspective?" }, { "from": "gpt", "value": "The white fluffy cloud at upper left appears higher in the sky than the snowy granite mountain range at center because it is much taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e9ba9def668fbe48.jpg", "conversations": [ { "from": "human", "value": "\nYou are a spectator sitting behind the green netting at the baseball game. You want to throw a small ball to the player wearing the white matte uniform at center. Considering the netting is 10 feet away from you, can you reach the player with your throw?" }, { "from": "gpt", "value": "The white matte uniform at center is 24.53 feet away from the camera. Since the netting is 10 feet away from you, the remaining distance to the player is 14.53 feet. You can likely reach the player with your throw." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d4eea8647ea7994.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.978, 0.983) and point (0.434, 0.469), which one is positioned in front?" }, { "from": "gpt", "value": "Positioned in front is point (0.978, 0.983)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4d9763e0f72bb300.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, concrete bridge at left or white metallic train at center, stands shorter?" }, { "from": "gpt", "value": "With less height is white metallic train at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/074c03ec4064d64a.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of red fleece jacket at upper left. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.198, 0.120)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b76d9b5bc53d9504.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, green textured trees at right or snowy white mountain range at upper left?" }, { "from": "gpt", "value": "green textured trees at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e492138809eded15.jpg", "conversations": [ { "from": "human", "value": "\nYou are a customer at this fast food restaurant and you want to order the white creamy ice cream at center. The server is wearing the floral fabric top at center. Where should you look to place your order?" }, { "from": "gpt", "value": "You should look at the server wearing the floral fabric top at center because the floral fabric top at center is above the white creamy ice cream at center, indicating their position relative to the ice cream." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/551305867788c6b5.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a blue floral skirt at lower center. Pinpoint a point to the blue floral skirt at lower center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.674, 0.791)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4506c6ff8f357ff6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if smooth red concrete stairs at center is positioned above smooth skin baby at center?" }, { "from": "gpt", "value": "Actually, smooth red concrete stairs at center is below smooth skin baby at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8d47cf41188ba71.jpg", "conversations": [ { "from": "human", "value": "\nIs dark gray jeans at lower left shorter than dark brown coat at left?" }, { "from": "gpt", "value": "Incorrect, dark gray jeans at lower left's height does not fall short of dark brown coat at left's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85f0bd5d0f5d4449.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the man in the brown velvety blazer at center. You want to focus on the exact point at coordinates point (0.553, 0.623). Is this point located on the man or somewhere else?" }, { "from": "gpt", "value": "The point (0.553, 0.623) is on the brown velvety blazer at center, so yes, it is located on the man." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c78dc58cdae1a6d3.jpg", "conversations": [ { "from": "human", "value": "\nWhere is dark brown textured tree at lower center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.479, 0.947)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/76a3b91b86421c08.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, transparent glass tower at center or red glass traffic light at right?" }, { "from": "gpt", "value": "red glass traffic light at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/afeaa7c74c95b1dc.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.460, 0.188) or point (0.879, 0.602)?" }, { "from": "gpt", "value": "The point (0.460, 0.188) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7f2957de384ae4a2.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if stone steps at center is wider than dark blue shirt at right?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/694d9df011e43660.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between green and white fabric flag at upper center and camera?" }, { "from": "gpt", "value": "The distance of green and white fabric flag at upper center from camera is 25.21 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/386ae3ecc1027eed.jpg", "conversations": [ { "from": "human", "value": "\nIs matte plastic toy at left shorter than pastel wax candles at center?" }, { "from": "gpt", "value": "Incorrect, matte plastic toy at left's height does not fall short of pastel wax candles at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6844bc9c47902160.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.946, 0.559) positioned behind point (0.685, 0.511)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b3beb1bd0602f1f.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, yellow fabric bowl at center or smooth black pants at lower left?" }, { "from": "gpt", "value": "Standing shorter between the two is yellow fabric bowl at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b97445ca9dc19ae8.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is shiny black sedan at center-right from shiny black sedan at center?" }, { "from": "gpt", "value": "shiny black sedan at center-right is 20.25 feet from shiny black sedan at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7412bbc423daf128.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.052, 0.717) or point (0.677, 0.666)?" }, { "from": "gpt", "value": "Positioned in front is point (0.677, 0.666)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7d8e7b40dfc0c8d8.jpg", "conversations": [ { "from": "human", "value": "\nDoes orange fabric folding chair at left appear on the left side of orange fabric beach chair at center?" }, { "from": "gpt", "value": "Indeed, orange fabric folding chair at left is positioned on the left side of orange fabric beach chair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d5dd5a2d05844e8c.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue liquid water at center have a lesser height compared to white glossy boat at left?" }, { "from": "gpt", "value": "Incorrect, blue liquid water at center's height does not fall short of white glossy boat at left's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ddc6c82cd6831ebc.jpg", "conversations": [ { "from": "human", "value": "\nBetween green satin hanbok at center and black matte vest at left, which one has more height?" }, { "from": "gpt", "value": "Standing taller between the two is black matte vest at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/da9a34d90037a94d.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up a shoot in this bar scene. You notice the white printed shirt at center and the translucent plastic table at center. Based on their heights, which object should you adjust your camera angle to focus on first?" }, { "from": "gpt", "value": "The white printed shirt at center has a greater height compared to the translucent plastic table at center, so you should adjust your camera angle to focus on the white printed shirt at center first." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a75d324fe9aa195b.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.827, 0.500) from camera?" }, { "from": "gpt", "value": "21.74 inches" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03b029e1578b0fba.jpg", "conversations": [ { "from": "human", "value": "\nYou are an inspector evaluating the building for safety concerns. You notice a point at coordinates (0.831, 0.623) on the building facade. What is the object located at this coordinate?" }, { "from": "gpt", "value": "The point at coordinates (0.831, 0.623) indicates a metallic wire at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9abf0ab6a818bc61.jpg", "conversations": [ { "from": "human", "value": "\nWhere is matte black flute at left located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.302, 0.708)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e08dcb971bdfb31.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black shirt at lower left have a greater width compared to dark blue uniform at center?" }, { "from": "gpt", "value": "Correct, the width of matte black shirt at lower left exceeds that of dark blue uniform at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/45ff9e67960f2a75.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.535, 0.645)?" }, { "from": "gpt", "value": "clear blue water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aad3b217de9ba640.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.531, 0.144) more distant than point (0.342, 0.175)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db9ec7d838772629.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the celebration and want to capture a photo where both the gray cotton polo shirt at center and the blonde hair at upper left are visible. Based on their heights, which one is more likely to be fully visible in the shot?" }, { "from": "gpt", "value": "The gray cotton polo shirt at center has a greater height compared to blonde hair at upper left, so it is more likely to be fully visible in the photo." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fdbbbb882b76ef62.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from pink flesh-colored tongue at center to camera." }, { "from": "gpt", "value": "pink flesh-colored tongue at center and camera are 12.93 inches apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2f1c1f161ccaa12.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.225, 0.545) positioned behind point (0.351, 0.706)?" }, { "from": "gpt", "value": "Yes, point (0.225, 0.545) is behind point (0.351, 0.706)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef7aad8e204d8cf7.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass football field at center thinner than textured fabric crowd at upper center?" }, { "from": "gpt", "value": "Yes, green grass football field at center is thinner than textured fabric crowd at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/12dacc3748cc068d.jpg", "conversations": [ { "from": "human", "value": "\nPoint to black glossy monitor at center.Point to the black glossy monitor at center in the image." }, { "from": "gpt", "value": "[(0.506, 0.414)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/338deafde3a2f8a9.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.588, 0.527)?" }, { "from": "gpt", "value": "matte plastic figure at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4b05d35a8a5ef360.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of metallic mesh chair at lower center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.444, 0.852)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1d36d47b02bd6c5.jpg", "conversations": [ { "from": "human", "value": "\nLocate dark fabric figure at center in the image." }, { "from": "gpt", "value": "[(0.580, 0.717)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b7f7559166d6857.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the metallic gray bridge at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.364, 0.373)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ffc1887838404c46.jpg", "conversations": [ { "from": "human", "value": "\nYou are an interior designer assessing a room with a skylight and artwork. You notice a black leather pillow at upper right and a white paper at center. Which object takes up more space in the visual field?" }, { "from": "gpt", "value": "The black leather pillow at upper right is bigger than the white paper at center, so it takes up more space in the visual field." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7caf267144fae66c.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown wooden path at center have a greater width compared to brown/thatched roof at upper center?" }, { "from": "gpt", "value": "In fact, brown wooden path at center might be narrower than brown/thatched roof at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08b097deaa0fe7f5.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance measurement between light brown wooden slats at right and white soft pillow at lower center?" }, { "from": "gpt", "value": "light brown wooden slats at right is 2.79 meters away from white soft pillow at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3fb09a39cbf39da4.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark blue uniform at center appear on the right side of dark brown hair at center?" }, { "from": "gpt", "value": "Indeed, dark blue uniform at center is positioned on the right side of dark brown hair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/15cb948f59e73da6.jpg", "conversations": [ { "from": "human", "value": "\nWhere is clear water at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.553, 0.892)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cdfa127d846dde43.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, white fluffy cloud at upper center or rustic wire at center?" }, { "from": "gpt", "value": "Standing shorter between the two is rustic wire at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9b7bcbf349bd90e.jpg", "conversations": [ { "from": "human", "value": "\nDoes patterned fabric dress at center have a lesser height compared to geometric-patterned fabric at left?" }, { "from": "gpt", "value": "In fact, patterned fabric dress at center may be taller than geometric-patterned fabric at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4dc266bbae61bedf.jpg", "conversations": [ { "from": "human", "value": "\nDoes floral fabric shirt at center have a lesser width compared to matte gold ring at upper right?" }, { "from": "gpt", "value": "Incorrect, floral fabric shirt at center's width is not less than matte gold ring at upper right's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a18bf7f406db827b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if stained concrete pillar at center is taller than white brick pillar at center?" }, { "from": "gpt", "value": "Correct, stained concrete pillar at center is much taller as white brick pillar at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cea55969a643d816.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, matte red sweater at center or green leather jacket at center?" }, { "from": "gpt", "value": "green leather jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aa453f1e294af5ee.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of smooth sand dune at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.301, 0.331)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/98d93f77ad4c9ce4.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the sunset scene. You want to ensure that both the green leafy tree at upper right and the smooth water at center are in focus. Based on their positions, which object should you focus on to maximize the depth of field for both?" }, { "from": "gpt", "value": "You should focus on the green leafy tree at upper right because it is located above the smooth water at center, so focusing on the closer object will help keep both in focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/62cd9b59bfcd1301.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.756, 0.164) closer to camera compared to point (0.912, 0.152)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/15c5f4de45ca6b4c.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a closeup shot of the raccoon on the left. You notice two points in the scene marked as point 1 at coordinates point (0.407, 0.412) and point 2 at coordinates point (0.014, 0.123). Which point should you focus on to ensure the raccoon on the left is in sharp focus?" }, { "from": "gpt", "value": "Point (0.407, 0.412) is closer to the camera than point (0.014, 0.123), so you should focus on point (0.407, 0.412) to ensure the raccoon on the left is in sharp focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/555efc24f0d6971b.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.732, 0.908) come farther from viewer compared to point (0.369, 0.963)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5495902667f3423.jpg", "conversations": [ { "from": "human", "value": "\nWhere is matte white lights at left located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.150, 0.436)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/020c68c93822b099.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the traditional thatched roof structure and notice two items at the center of the scene. Which item is located to the left of the other? The brown sandy ground at center and the yellow cotton tank top at center." }, { "from": "gpt", "value": "The yellow cotton tank top at center is to the left of the brown sandy ground at center because the brown sandy ground at center is positioned on the right side of the yellow cotton tank top at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c79d8b951bf51d10.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black laptop at left have a greater width compared to white hair at center?" }, { "from": "gpt", "value": "Incorrect, matte black laptop at left's width does not surpass white hair at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/724f4223518882ec.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the garden and want to walk towards the historic structure in the background. You notice two points marked in the scene. Which point, point (0.441, 0.553) or point (0.147, 0.383), is closer to you as you face the garden?" }, { "from": "gpt", "value": "Point (0.441, 0.553) is closer to the viewer than point (0.147, 0.383)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70b0d25e6416417d.jpg", "conversations": [ { "from": "human", "value": "\nLocate all matte black computer tower at center in the image." }, { "from": "gpt", "value": "[(0.160, 0.523)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/64560f706c76cceb.jpg", "conversations": [ { "from": "human", "value": "\nYou are planning to move the green metallic pole at lower left to the location where the green painted wood hut at center is currently. Will the pole fit in the space if you move it there?" }, { "from": "gpt", "value": "The green painted wood hut at center is wider than the green metallic pole at lower left. Since the pole is narrower, it will fit in the space where the hut is currently located." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/faf293c041578f63.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between matte black shirt at left and white sailboat at left?" }, { "from": "gpt", "value": "140.64 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/80a17bc6bd55e269.jpg", "conversations": [ { "from": "human", "value": "\nDoes green plastic boat at center have a smaller size compared to blue plastic kayak at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/761a29061e0aba3c.jpg", "conversations": [ { "from": "human", "value": "\nYou are a snorkeler trying to adjust your gear. You need to reach your transparent rubber goggles at center while holding onto your black matte shorts at center. Which direction should you move your hand to grab the goggles?" }, { "from": "gpt", "value": "The transparent rubber goggles at center are to the right of the black matte shorts at center. So you should move your hand to the right to grab the transparent rubber goggles at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf649b3ba1707125.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.986, 0.945) come in front of point (0.069, 0.578)?" }, { "from": "gpt", "value": "Yes, point (0.986, 0.945) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8df8a17b6a7d2147.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the brick railing in the foreground. You want to capture a photo that includes both the blue glass water at center and the bronze polished lamp post at center right. Based on their positions, will the lamp post appear above or below the water in the photo?" }, { "from": "gpt", "value": "The blue glass water at center is below the bronze polished lamp post at center right, so in the photo, the lamp post will appear above the water." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f7fb04f1bf673ca.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, smooth plastic face at center or matte striped shirt at center?" }, { "from": "gpt", "value": "Standing taller between the two is matte striped shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/18e3cc20c95f0a15.jpg", "conversations": [ { "from": "human", "value": "\nYou are a guest at this event and want to grab a drink from the translucent glass cup at center without disturbing the man in the white checkered shirt at center. What is the minimum distance you need to move to reach the cup?" }, { "from": "gpt", "value": "The minimum distance you need to move is 6.95 meters to reach the translucent glass cup at center from the white checkered shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c0c493e87cb25531.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.924, 0.912) and point (0.249, 0.627), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.249, 0.627) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc37f70f7132d390.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the concrete at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.030, 0.177)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b24bcfe33de1d0f.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, smooth brown bark at left or blue cotton shirt at lower right?" }, { "from": "gpt", "value": "smooth brown bark at left is higher up." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ef727123879c29c.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of matte black dress at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.523, 0.356)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/026c3c7cc8e679e6.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.077, 0.850) or point (0.912, 0.861)?" }, { "from": "gpt", "value": "Point (0.077, 0.850) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3f23cf6af15562b6.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, white fabric shirt at center or sunglasses at center?" }, { "from": "gpt", "value": "From the viewer's perspective, white fabric shirt at center appears more on the left side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9a44607fe593c61c.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of white cotton t-shirt at left in the image." }, { "from": "gpt", "value": "[(0.272, 0.650)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/81cfc39f2d37e32c.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.526, 0.739) come farther from viewer compared to point (0.893, 0.188)?" }, { "from": "gpt", "value": "No, (0.526, 0.739) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95c0f21c39c87c87.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.168, 0.230) and point (0.444, 0.234), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.444, 0.234) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6606d45c3ac73ce.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the red matte snowboard at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.537, 0.564)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ccdfa54d5956d95a.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the gray concrete sidewalk at lower left and want to place the dark gray cotton shirt at lower left on the sidewalk. Will the shirt fit entirely on the sidewalk without overlapping the edges?" }, { "from": "gpt", "value": "The gray concrete sidewalk at lower left is wider than the dark gray cotton shirt at lower left, so the shirt will fit entirely on the sidewalk without overlapping the edges." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a97d9d1a255d8cd3.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of silver metallic suv at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.916, 0.581)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf523ac7463f94ea.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, yellow matte eagle at center or matte black shirt at center?" }, { "from": "gpt", "value": "matte black shirt at center is higher up." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/33ae4dacdefb309b.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the room described and need to locate the white striped shirt at left. According to the coordinates given, where should you look to find it?" }, { "from": "gpt", "value": "The white striped shirt at left is located at coordinates point (0.231, 0.670)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/219779a3319f3b0c.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the rural area and want to approach both the brown mud hut at right and the white printed shirt at left. Which one will you reach first?" }, { "from": "gpt", "value": "You will reach the brown mud hut at right first because it is closer to you than the white printed shirt at left, which is further away." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c1a80bfaf4eb4236.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing an event and need to place the black matte jacket at center and the white paper at center on a shelf. Which item should you place first if you want the other to be on top?" }, { "from": "gpt", "value": "The black matte jacket at center should be placed first on the shelf because it is below the white paper at center, so placing it first allows the white paper at center to be placed on top of it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f9000283e8e82983.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a frozen ice at lower left. Pinpoint a point to the frozen ice at lower left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.422, 0.825)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3bb92ac6b4ba3970.jpg", "conversations": [ { "from": "human", "value": "\nLocate black matte mug at center in the image." }, { "from": "gpt", "value": "[(0.472, 0.536)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/14b7abc0f98c6a2e.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, golden reflective water at center or wooden dark boat at center, stands shorter?" }, { "from": "gpt", "value": "Standing shorter between the two is golden reflective water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/536d16bf4522e6e9.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown hair at lower right have a larger size compared to white textured cauliflower at center?" }, { "from": "gpt", "value": "Yes, brown hair at lower right is bigger than white textured cauliflower at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34f612d163f3cc8b.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.694, 0.577) and point (0.011, 0.492), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.694, 0.577) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0224cf6f478e93a2.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, rugged brown cliff at upper left or matte black coat at center?" }, { "from": "gpt", "value": "With more height is rugged brown cliff at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc57f9d7b01f89f5.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black suit at center have a lesser height compared to orange silk tie at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/65372f1a83f36390.jpg", "conversations": [ { "from": "human", "value": "\nDoes concrete sidewalk at center right have a lesser height compared to white cotton shirt at center?" }, { "from": "gpt", "value": "No, concrete sidewalk at center right is not shorter than white cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e86635e1950aa93f.jpg", "conversations": [ { "from": "human", "value": "\nYou are a fashion designer observing the scene and notice two white garments at the center of the path. Which one is taller between the matte white jacket at center and the fluffy white sweater at center?" }, { "from": "gpt", "value": "The matte white jacket at center is taller than the fluffy white sweater at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/378e142118318cfb.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.529, 0.986) or (0.478, 0.489)?" }, { "from": "gpt", "value": "The point (0.478, 0.489) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/59c1eae05a0c864c.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.205, 0.406) closer to viewer compared to point (0.484, 0.838)?" }, { "from": "gpt", "value": "No, (0.205, 0.406) is further to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/268dc8da5ae6fe42.jpg", "conversations": [ { "from": "human", "value": "\nHow close is matte yellow tower at upper center from brown shingles at center?" }, { "from": "gpt", "value": "487.05 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9469fe079a37e6f7.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the yellow leather jacket at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.050, 0.292)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e036bf9d9f5588f.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of the building on the left side of the street and want to find the dark green fur coat at lower right. According to the coordinates provided, is the coat closer to the street or the building?" }, { "from": "gpt", "value": "The dark green fur coat at lower right is located at point 0.791 on the x and 0.904 on the y axis. Since the coordinates are relative to the image, the lower right corner is at (1.000, 1.000). The coat is closer to the street because its x coordinate is 0.791, which is closer to 1 than to 0, indicating proximity to the right side of the image, which corresponds to the street side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b01084e4a3c439dc.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.298, 0.966) and point (0.089, 0.964), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.298, 0.966) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7b167f1709b6fdf.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.496, 0.917)?" }, { "from": "gpt", "value": "brown dry grass at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d07acc0a43c3e3b5.jpg", "conversations": [ { "from": "human", "value": "\nYou are a stagehand standing at the front of the stage. You need to move a heavy equipment from the back of the stage to the front. There are two points marked on the stage. The first point is at point (0.444, 0.542) and the second point is at point (0.516, 0.858). Which point should you pass through first to reach the front?" }, { "from": "gpt", "value": "Point (0.444, 0.542) is behind point (0.516, 0.858), so you should pass through point (0.516, 0.858) first to reach the front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3baeac55257546d2.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is purple matte shirt at center from camera?" }, { "from": "gpt", "value": "21.34 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/684d9278bb632218.jpg", "conversations": [ { "from": "human", "value": "\nIs dark blue jacket at center bigger than gray woolen hat at lower right?" }, { "from": "gpt", "value": "No, dark blue jacket at center is not bigger than gray woolen hat at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00cd34a0e0690228.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked by the coordinates point (0.846, 0.642). You want to walk to the airplane window. How far do you need to walk?" }, { "from": "gpt", "value": "The distance between point (0.846, 0.642) and the viewer is 5.65 meters, so you need to walk 5.65 meters to reach the airplane window." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de9f0477fe2b0e84.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, brown glass bottle at center or translucent glass at left?" }, { "from": "gpt", "value": "Positioned to the left is translucent glass at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6969e66b7204e53.jpg", "conversations": [ { "from": "human", "value": "\nHow close is matte blue jacket at center from camera?" }, { "from": "gpt", "value": "They are 35.67 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/846156c080fc8bab.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if rugged rock mountain range at center is positioned to the right of gray metallic train track at lower center?" }, { "from": "gpt", "value": "No, rugged rock mountain range at center is not to the right of gray metallic train track at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/648d1d4864c13f89.jpg", "conversations": [ { "from": "human", "value": "\nYou are an interior designer planning to place a new lamp between the black plastic drawer at lower left and the black glossy monitor at upper right. Considering their heights, which object should the lamp be placed closer to in order to ensure stability?" }, { "from": "gpt", "value": "The black plastic drawer at lower left has a greater height compared to the black glossy monitor at upper right. To ensure stability, the lamp should be placed closer to the taller object, so the lamp should be placed closer to the black plastic drawer at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/62c60572b0adbeef.jpg", "conversations": [ { "from": "human", "value": "\nYou are a plumber who needs to install a pipe connecting the two black polished sinks at center. The pipes you have are 3 feet long. Will the pipes be long enough?" }, { "from": "gpt", "value": "The black polished sinks at center are 3.58 feet apart. The pipes you have are only 3 feet long, so they are not long enough to connect the two sinks." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f25ca92c947101c4.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, camouflage uniform at center or camouflage uniform at left?" }, { "from": "gpt", "value": "camouflage uniform at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fdf74052b1bb0873.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.199, 0.486)?" }, { "from": "gpt", "value": "dark gray cloud at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/90c9cd19ff2861cd.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow matte clownfish at center to the left of glossy blue fish at upper right from the viewer's perspective?" }, { "from": "gpt", "value": "Indeed, yellow matte clownfish at center is positioned on the left side of glossy blue fish at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba1c1b6ef0a7078b.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.818, 0.336) closer to viewer compared to point (0.145, 0.598)?" }, { "from": "gpt", "value": "No, (0.818, 0.336) is further to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b398d1669911f319.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery driver approaching the resort complex. You need to park your shiny silver car at lower right near the beige stone hotel at right. Based on the scene, can you drive your car directly to the hotel without moving any other vehicles?" }, { "from": "gpt", "value": "The beige stone hotel at right is positioned over the shiny silver car at lower right, which means the car is already parked near the hotel. Therefore, you don not need to move any other vehicles to park there." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5287d11eec0cf1a.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing on the rocky outcrop in the foreground. You want to capture a photo that includes both the smooth blue water at center and the green leafy island at center. Which object will appear larger in the photo?" }, { "from": "gpt", "value": "The smooth blue water at center will appear larger in the photo because it has a greater height compared to the green leafy island at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1538710ef148cbb0.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of green matte shirt at center less distant than that of green fabric shirt at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/204d7dbc801799c9.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of translucent glass balloon at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.724, 0.153)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/22e30e8baab09f99.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a wooden deck at center. Pinpoint a point to the wooden deck at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.423, 0.792)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8b29446f9d4f155.jpg", "conversations": [ { "from": "human", "value": "\nYou are a birdwatcher observing the scene. You notice the brown rough tree trunk at center and the brown speckled feathers at upper center. Which object is taller?" }, { "from": "gpt", "value": "The brown rough tree trunk at center is taller than the brown speckled feathers at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01005cf764611062.jpg", "conversations": [ { "from": "human", "value": "\nYou are an architect analyzing the urban skyline. You observe the matte glass building at left and the dark glass building at center. Which building has a taller structure?" }, { "from": "gpt", "value": "The matte glass building at left has a greater height compared to the dark glass building at center, so it is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/257d7745ad2321f4.jpg", "conversations": [ { "from": "human", "value": "\nYou are a drone operator tasked with flying a drone from the glassy silver tower at center to the shiny metallic spire at right. The drone has a maximum flight range of 120 meters. Based on the scene, can the drone reach its destination?" }, { "from": "gpt", "value": "The distance between the glassy silver tower at center and the shiny metallic spire at right is 131.69 meters. Since the drone can only fly up to 120 meters, it cannot reach the destination without recharging or refueling." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dcf6036ff2150ed4.jpg", "conversations": [ { "from": "human", "value": "\nDoes translucent plastic forehead at center appear on the left side of matte white nose at center?" }, { "from": "gpt", "value": "In fact, translucent plastic forehead at center is to the right of matte white nose at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c80949ebb368f114.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from dark green shorts at center to camera." }, { "from": "gpt", "value": "A distance of 12.93 meters exists between dark green shorts at center and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f77b13bcc9376f6.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the brown sandy ground at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.696, 0.681)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d34a623107171c0c.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the garden looking at the pile of black plastic bags. There are two points marked in the image. One is at coordinate point (0.520, 0.738) and the other is at point (0.318, 0.005). Which point is closer to you?" }, { "from": "gpt", "value": "Point (0.520, 0.738) is closer to the viewer than point (0.318, 0.005)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d2fb96b5001e2180.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the green leafy tree at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.504, 0.155)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f9dd2e10b0bb3d46.jpg", "conversations": [ { "from": "human", "value": "\nYou are an animal behaviorist observing the scene. The tabby fur cat at center is positioned in a specific location. Can you determine if the cat is closer to the person or farther away based on its coordinates?" }, { "from": "gpt", "value": "The tabby fur cat at center is located at point (0.616, 0.731), which places it centrally and slightly towards the right, indicating it is resting against the person and thus close to them." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a25fd49d5ee261ea.jpg", "conversations": [ { "from": "human", "value": "\nIs orange floral dress at lower left taller than white paper plate at lower center?" }, { "from": "gpt", "value": "Indeed, orange floral dress at lower left has a greater height compared to white paper plate at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/542d2921c7965d9f.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the outdoor scene and want to place a small garden gnome that requires 2 meters of space between it and the viewer. Can the green grass at lower center accommodate the gnome?" }, { "from": "gpt", "value": "The green grass at lower center is 2.18 meters away from the viewer, which is more than the required 2 meters, so the gnome can be placed there." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/961ff302f16777f4.jpg", "conversations": [ { "from": "human", "value": "\nDoes wet fur otter at lower left lie in front of shiny brown otter at center?" }, { "from": "gpt", "value": "Yes, wet fur otter at lower left is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf81e649b6cfc2e5.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow matte shorts at left to the right of black matte referee uniform at right from the viewer's perspective?" }, { "from": "gpt", "value": "Incorrect, yellow matte shorts at left is not on the right side of black matte referee uniform at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/68a367496c889e08.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the event and need to capture a photo where the matte white screen at upper left and the matte black suit at center are both visible. Given that the screen is taller than the suit, how should you adjust your camera angle to ensure both are fully in frame?" }, { "from": "gpt", "value": "Since the matte white screen at upper left is taller than the matte black suit at center, you should angle the camera upwards slightly to capture the full height of the screen while still including the suit in the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00a554e4545e8b5d.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of orange carved pumpkin at center in the image." }, { "from": "gpt", "value": "[(0.534, 0.406)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a83ece066de187b0.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.674, 0.483) and point (0.703, 0.769), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.674, 0.483) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/83ad013ba9b3c44a.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of blue fleece jacket at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.299, 0.536)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2050c25afeabcea3.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white striped fabric at center is bigger than purple plastic glasses at upper left?" }, { "from": "gpt", "value": "Correct, white striped fabric at center is larger in size than purple plastic glasses at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/404b62d0d4705d25.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if clear glass beer at center is smaller than striped fabric shirt at upper center?" }, { "from": "gpt", "value": "Correct, clear glass beer at center occupies less space than striped fabric shirt at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0894bdc3bae9c41e.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the room and want to know the exact position of the white sheer curtain at upper center. Can you tell me its coordinates?" }, { "from": "gpt", "value": "The white sheer curtain at upper center is located at coordinates point (0.530, 0.156)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5969ae3a4225d5f5.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the beige matte suv at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.815, 0.823)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7530f557b7d51c4b.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a closeup of the dark brown hair at lower left and the white matte shirt at upper center. Which object should you focus on first to ensure both are in focus?" }, { "from": "gpt", "value": "The dark brown hair at lower left is closer to the viewer than the white matte shirt at upper center. To ensure both are in focus, you should focus on the dark brown hair at lower left first." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1833b26fd0a5ac77.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any gray rough rock at center in the image." }, { "from": "gpt", "value": "[(0.384, 0.505)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b0655692de6d46e.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.408, 0.784) and point (0.639, 0.697), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.639, 0.697) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ee6b53585ead951.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.558, 0.863)?" }, { "from": "gpt", "value": "green plastic pavement at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b13b5d3da9ec68cc.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.864, 0.192)?" }, { "from": "gpt", "value": "green textured tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d053b16407a0b1bc.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a matte purple dress at left. Pinpoint a point to the matte purple dress at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.329, 0.406)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c3493fc7f358b5eb.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the green leafy tree at upper left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.615, 0.087)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fba39bbeaef3fd39.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the white paper at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.609, 0.722)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7a39963c30f5608.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the event and want to capture a photo of the black and white dress at center and the smooth black hair at center. Which object would you need to adjust your camera settings for to ensure proper focus if the dress is wider than the hair?" }, { "from": "gpt", "value": "The black and white dress at center is wider than the smooth black hair at center, so you should adjust your camera settings to focus on the dress to account for its larger size." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1afaf4bfb1271dee.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the white bird in the center. The bird is at point (0.363, 0.630). You need to adjust your camera to focus on the bird. What is the exact location of the bird?" }, { "from": "gpt", "value": "The bird is located at point (0.363, 0.630)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd15bf381d29128e.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.980, 0.697) from camera?" }, { "from": "gpt", "value": "22.88 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e49385a2978b6038.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of silvery gray fur at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.488, 0.508)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ab27f26820b9e45.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black lantern at upper right have a smaller size compared to matte glass candle at center?" }, { "from": "gpt", "value": "No, matte black lantern at upper right is not smaller than matte glass candle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/efd7a6dd7c8cada5.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the conference room and need to find the matte white shirt at center. According to the coordinates provided, where should you look relative to the bottom left corner of the image?" }, { "from": "gpt", "value": "The matte white shirt at center is located at point coordinates 0.555 along the x axis and 0.889 along the y axis relative to the bottom left corner of the image." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b2e320761068942b.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at left have a larger size compared to metallic lattice tower at upper left?" }, { "from": "gpt", "value": "No, green leafy tree at left is not bigger than metallic lattice tower at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c76fc460952297a9.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the granite rock at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.178, 0.772)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46b17825674fcc80.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.472, 0.831) come in front of point (0.499, 0.358)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d2dcb67f21ca6a6.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.408, 0.616) positioned after point (0.925, 0.425)?" }, { "from": "gpt", "value": "No, (0.408, 0.616) is in front of (0.925, 0.425)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ae78323fe57707cc.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, matte plastic teddy bears at upper left or matte blue fabric shirt at upper center?" }, { "from": "gpt", "value": "Positioned lower is matte blue fabric shirt at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b42c53dee01ed88.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.700, 0.550) from camera?" }, { "from": "gpt", "value": "Point (0.700, 0.550) and camera are 23.34 feet apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/581934d247b3b7fd.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of black silhouette giraffe at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.291, 0.491)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7ecce184712f561.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the high-visibility fabric safety vest at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.670, 0.497)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/11179533f056312d.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between rusty metal door at center and camera." }, { "from": "gpt", "value": "rusty metal door at center and camera are 44.48 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/af04d28979d1ad30.jpg", "conversations": [ { "from": "human", "value": "\nPoint to polished bronze statue at upper center.Point to the polished bronze statue at upper center in the image." }, { "from": "gpt", "value": "[(0.653, 0.161)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de0638304094ae87.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the wooden pier and want to walk towards the water. You see two points marked on the pier, point 1 at coordinates point (0.817, 0.905) and point 2 at coordinates point (0.814, 0.605). Which point is closer to you as you face the water?" }, { "from": "gpt", "value": "Point 1 at coordinates point (0.817, 0.905) is closer to you because it is further to the viewer than point 2 at coordinates point (0.814, 0.605)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d6fb6088301ec27.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the knitted fabric placemat at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.692, 0.806)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d64b8a7f5735d1c4.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from royal blue satin dress at left to camera." }, { "from": "gpt", "value": "A distance of 5.08 feet exists between royal blue satin dress at left and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f69dd4e4c115a05e.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, gray cotton t-shirt at center or white plastic table at center, stands shorter?" }, { "from": "gpt", "value": "With less height is white plastic table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2a6f75c80ab1e2fc.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.319, 0.917)?" }, { "from": "gpt", "value": "black plastic camera at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92eacc922bb132c2.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked as point (0.538, 0.766) in the image. What material are you standing on?" }, { "from": "gpt", "value": "You are standing on gray gravel at center at point (0.538, 0.766)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/65f6e6dff0c8840b.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person trying to navigate through the scene. You need to pass between the green metallic cart at center and the light gray fabric shirt at center. Which side of the cart should you go around to avoid the person?" }, { "from": "gpt", "value": "Since the green metallic cart at center is on the left side of the light gray fabric shirt at center, you should go around the right side of the green metallic cart at center to avoid the person." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c2b7c8ce4b8087e4.jpg", "conversations": [ { "from": "human", "value": "\nDoes printed fabric dress at center lie in front of printed cotton dress at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/25a15f024ebf1920.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the left, matte red dress at center or black printed blouse at center?" }, { "from": "gpt", "value": "matte red dress at center is more to the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4e4b8fda19b1ad0.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.400, 0.481) or point (0.829, 0.477)?" }, { "from": "gpt", "value": "The point (0.829, 0.477) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d07ab9cb4655af09.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth stone rocks at center wider than golden yellow leaves at upper left?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9bbeb2de94882e18.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of clear glass window at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.360, 0.381)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23323f80c037cd73.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.165, 0.877)?" }, { "from": "gpt", "value": "blue fabric table at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/14a73ba5831b688e.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.542, 0.228) or (0.817, 0.784)?" }, { "from": "gpt", "value": "The point (0.542, 0.228) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0cda635d6851fde7.jpg", "conversations": [ { "from": "human", "value": "\nBetween brown murky water at center and green grass at center, which one is positioned lower?" }, { "from": "gpt", "value": "brown murky water at center is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/026826a0e459af6a.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, shiny red sweater at center or dark blue jeans at center?" }, { "from": "gpt", "value": "dark blue jeans at center is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8859d1edd0a099d2.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of point (0.958, 0.492)?" }, { "from": "gpt", "value": "644.58 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b3d70202edfc543.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.516, 0.362) or (0.015, 0.511)?" }, { "from": "gpt", "value": "Point (0.516, 0.362)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2a321402a85ee2c8.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny brown canoe at center further to camera compared to yellow life vest at center?" }, { "from": "gpt", "value": "No, it is in front of yellow life vest at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f55a015e504bb7b4.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.124, 0.739) behind point (0.450, 0.662)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/144d3a1fe2d22b36.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from water at lower center to camera." }, { "from": "gpt", "value": "water at lower center and camera are 19.45 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fcd0b5b91d1c3c34.jpg", "conversations": [ { "from": "human", "value": "\nIs green silk blouse at upper right shorter than green beaded bracelet at lower right?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3fccd9d1d4f510dc.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.948, 0.912)?" }, { "from": "gpt", "value": "blonde hair at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c8a78182f6060579.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, green concrete stairs at center or matte orange shirt at center?" }, { "from": "gpt", "value": "matte orange shirt at center is higher up." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c5361b0045c3c146.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up a shoot for a pet photoshoot. You have two dogs wearing costumes. The black matte costume at center and the white fabric dress at left. You need to position them side by side so that their costumes don not overlap. Based on the scene description, which costume should be placed closer to the camera to prevent overlapping?" }, { "from": "gpt", "value": "The white fabric dress at left should be placed closer to the camera because the black matte costume at center might be wider than the white fabric dress at left, so positioning the narrower one closer will help prevent overlap." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cdd9497015181c41.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the lounge area and see the blue cotton shirt at right and the white fabric bag at center. Which object is positioned more to the right side of the scene?" }, { "from": "gpt", "value": "The blue cotton shirt at right is positioned more to the right side of the scene compared to the white fabric bag at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6f19347088fbd0f.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.324, 0.469) come closer to viewer compared to point (0.544, 0.147)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c9785d0a50006ec2.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.098, 0.847) farther from camera compared to point (0.495, 0.664)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cfab325c3769d825.jpg", "conversations": [ { "from": "human", "value": "\nPoint to silhouette hooded coat at center.Point to the silhouette hooded coat at center in the image." }, { "from": "gpt", "value": "[(0.427, 0.928)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8010c66823acc271.jpg", "conversations": [ { "from": "human", "value": "\nIs camouflage jacket at right bigger than white fabric coat at center?" }, { "from": "gpt", "value": "No, camouflage jacket at right is not bigger than white fabric coat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d6527a74014865e.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of brown cotton shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.521, 0.655)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d89ea63880131c56.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the edge of the grassy area. You want to take a photo of the green grass at lower center and the translucent plastic bottle at lower left. Which object should you focus on first if you want to capture both in a single frame without moving your camera?" }, { "from": "gpt", "value": "You should focus on the translucent plastic bottle at lower left first because it is above the green grass at lower center, so adjusting the focus to start with the closer object ensures both will be in the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4e6d884a33d3802.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a candid shot of the wet hair at center and the white matte baseball cap at upper center. Since the background is blurred, can you tell which object is closer to the camera based on their positions?" }, { "from": "gpt", "value": "The wet hair at center is closer to the camera than the white matte baseball cap at upper center because it is positioned in front of it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e424f5f42ab98032.jpg", "conversations": [ { "from": "human", "value": "\nYou are a visitor driving through Kansas and see the blue painted wood sign at center and the blue plastic sign at center. Which one is taller?" }, { "from": "gpt", "value": "The blue painted wood sign at center is taller than the blue plastic sign at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c9d5e82be1c59f9.jpg", "conversations": [ { "from": "human", "value": "\nDoes silhouette tree at left lie in front of green matte tree at center?" }, { "from": "gpt", "value": "Yes, silhouette tree at left is in front of green matte tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f65a018f1e3b9b8.jpg", "conversations": [ { "from": "human", "value": "\nLocate all matte black golf club at center in the image." }, { "from": "gpt", "value": "[(0.512, 0.667)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f228dbb3f97b605d.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.381, 0.564) or (0.505, 0.867)?" }, { "from": "gpt", "value": "Positioned in front is point (0.505, 0.867)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00b211e7adf55636.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.678, 0.564) and point (0.466, 0.662), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.678, 0.564)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/439e628dfcb297d0.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.518, 0.725) and point (0.410, 0.748), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.518, 0.725)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/210e36dd60bf88b6.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.288, 0.806) or point (0.548, 0.537)?" }, { "from": "gpt", "value": "Point (0.288, 0.806) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e7a8ecfd6d3ef4a0.jpg", "conversations": [ { "from": "human", "value": "\nIs white glossy sedan at center to the left of white matte sedan at center from the viewer's perspective?" }, { "from": "gpt", "value": "Correct, you'll find white glossy sedan at center to the left of white matte sedan at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6fe62b6fce5b19ae.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the post office scene and want to place a small package between the two points labeled point (0.199, 0.688) and point (0.409, 0.694). Which point should the package be closer to so it is placed in front?" }, { "from": "gpt", "value": "The package should be closer to point (0.199, 0.688) because it is in front of point (0.409, 0.694)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c6b00c70e11ecc3f.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the white textured dress at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.329, 0.597)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/008ef43e209de737.jpg", "conversations": [ { "from": "human", "value": "\nYou are planning to place a decorative bowl between the powdery brown pastry at upper left and the dark purple jam at center on the table. Based on their sizes, can you estimate whether there will be enough space between them to fit the bowl?" }, { "from": "gpt", "value": "The powdery brown pastry at upper left might be wider than dark purple jam at center, so there may not be enough space between them to fit the bowl unless it is very small." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/83dee15360d68d38.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of matte black ski at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.652, 0.838)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/389ef9070b707ec5.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the cloudy sky at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.481, 0.214)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8ee874f1c2453c81.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the transparent glass pool at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.502, 0.778)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e7368e55eb1841c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if knitted wool sweater at center is bigger than metallic silver microphone at center?" }, { "from": "gpt", "value": "Indeed, knitted wool sweater at center has a larger size compared to metallic silver microphone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0017f72c2f2692c3.jpg", "conversations": [ { "from": "human", "value": "\nDoes black matte sweater at center have a greater width compared to purple cotton shirt at center?" }, { "from": "gpt", "value": "Incorrect, black matte sweater at center's width does not surpass purple cotton shirt at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/683ff06e75caeda9.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.033, 0.944) behind point (0.392, 0.858)?" }, { "from": "gpt", "value": "No, (0.033, 0.944) is in front of (0.392, 0.858)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/09d87af81aa6b8cd.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of matte black pavement at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.464, 0.802)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dbdaa40d675413d4.jpg", "conversations": [ { "from": "human", "value": "\nYou are driving and want to know the position of the green leafy tree at right relative to the center of the windshield. Is it to the left or right of the center?" }, { "from": "gpt", "value": "The green leafy tree at right is located at point 0.225 on the x axis, which is to the left of the center of the windshield." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8933068de6e500a5.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the matte yellow paper at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.300, 0.305)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7c379e74ca71adf5.jpg", "conversations": [ { "from": "human", "value": "\nYou are a birdwatcher observing the scene. You notice the white fluffy birds at left and the green leafy tree at upper right. Which object occupies more space in the image?" }, { "from": "gpt", "value": "The white fluffy birds at left has a larger size compared to the green leafy tree at upper right, so the white fluffy birds at left occupies more space in the image." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f5639a61ce987f8.jpg", "conversations": [ { "from": "human", "value": "\nYou are a tailor trying to determine if the denim at center can cover the matte black boot at center. Based on the size comparison provided, what is your assessment?" }, { "from": "gpt", "value": "The denim at center is smaller than the matte black boot at center, so it cannot fully cover the boot." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b80d82c5f5ff256.jpg", "conversations": [ { "from": "human", "value": "\nDoes white silky water at left lie behind clear water at right?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a582b5b684fb5291.jpg", "conversations": [ { "from": "human", "value": "\nYou are an architect designing a new building and want to incorporate two black metal poles in the design. You have a limited budget and can only use one type of metal pole. Based on the image, which pole would be more cost effective to replicate, the black metal pole at center or the black metal pole at left?" }, { "from": "gpt", "value": "The black metal pole at center is thinner than the black metal pole at left, so replicating the black metal pole at center would be more cost effective as it requires less material." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/da2c4aa1639939f8.jpg", "conversations": [ { "from": "human", "value": "\nDoes white glossy cruise ship at center have a greater width compared to clear blue water at lower center?" }, { "from": "gpt", "value": "Yes, white glossy cruise ship at center is wider than clear blue water at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8347fdf4dc828f42.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.496, 0.117) and camera." }, { "from": "gpt", "value": "Point (0.496, 0.117) is 4.81 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f698ffbf306efcc0.jpg", "conversations": [ { "from": "human", "value": "\nHow far is metallic gray water tower at upper center from metallic green water tower at upper left?" }, { "from": "gpt", "value": "metallic gray water tower at upper center is 63.38 meters from metallic green water tower at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd0cd09428b7751c.jpg", "conversations": [ { "from": "human", "value": "\nYou are a customer in a store looking to place both the metallic silver table at center and the brown silky hair at upper right on a shelf. The shelf has a width of 1.2 meters. Can both items fit side by side on the shelf without overlapping?" }, { "from": "gpt", "value": "The metallic silver table at center might be wider than brown silky hair at upper right. Since the shelf is 1.2 meters wide, it is uncertain if both items can fit side by side without overlapping because the exact widths are not provided." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e14a9e64b1bd7f03.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.453, 0.562) or point (0.533, 0.505)?" }, { "from": "gpt", "value": "Point (0.533, 0.505) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d5f9fbd41261b723.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the dirt path and looking towards the wooden gate. Which object, the brown soil at center or the dark gray fluffy cloud at upper left, is closer to you?" }, { "from": "gpt", "value": "The brown soil at center is closer to you because it is taller than the dark gray fluffy cloud at upper left, indicating it occupies a lower position in the visual field." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01e727d10126f7ab.jpg", "conversations": [ { "from": "human", "value": "\nYou are a character in the image standing at the center of the room. You want to pick up the matte red dress at center to try it on. Which direction should you move to reach it?" }, { "from": "gpt", "value": "Since the matte red dress at center is located at point coordinates of (0.467, 0.348), you should move towards the center of the room to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b6962a9afc4998e.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the open grassy area looking at the two rockets. Which of the two points, point (0.661, 0.463) or point (0.894, 0.087), appears closer to you?" }, { "from": "gpt", "value": "Point (0.661, 0.463) is closer to the camera than point (0.894, 0.087), so it appears closer to you." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/87ca67b48d645858.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white leather jacket at lower right is shorter than green fabric jacket at center?" }, { "from": "gpt", "value": "In fact, white leather jacket at lower right may be taller than green fabric jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db8183cc7384db86.jpg", "conversations": [ { "from": "human", "value": "\nYou are a passenger waiting at the train station. You see the white glossy train at left and the metallic train track at right. Which object is nearer to you?" }, { "from": "gpt", "value": "The white glossy train at left is closer to the viewer than the metallic train track at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/55e7e185dd9a078d.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.600, 0.614) come closer to viewer compared to point (0.603, 0.980)?" }, { "from": "gpt", "value": "Yes, point (0.600, 0.614) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc2cb85fa7bd5f18.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of dark gray suit at center less distant than that of suede beige blazer at right?" }, { "from": "gpt", "value": "No, dark gray suit at center is further to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82e20682ac680997.jpg", "conversations": [ { "from": "human", "value": "\nYou are attending a formal event and notice two items on the speaker at center. Which item is taller between the dark suit at center and the dark purple dotted tie at center?" }, { "from": "gpt", "value": "The dark suit at center is taller than the dark purple dotted tie at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/96f5403b08ad8d13.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny chrome motorcycle at left further to the viewer compared to blue glossy motorcycle at right?" }, { "from": "gpt", "value": "No, shiny chrome motorcycle at left is in front of blue glossy motorcycle at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37720b8dd6fd9b1e.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of green grassy hillside at upper center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.325, 0.231)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d29f1f8e45d30b66.jpg", "conversations": [ { "from": "human", "value": "\nBetween brown leather jacket at center and matte black coat at lower left, which one is positioned lower?" }, { "from": "gpt", "value": "matte black coat at lower left is below." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea8a16f391498528.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue fabric curtain at right is positioned to the right of dark carpeted stairs at center?" }, { "from": "gpt", "value": "Correct, you'll find blue fabric curtain at right to the right of dark carpeted stairs at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f6a460934f701e1.jpg", "conversations": [ { "from": "human", "value": "\nDoes wooden furniture at center appear under yellow matte car at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec162ded4aff0df4.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.536, 0.716) or (0.584, 0.452)?" }, { "from": "gpt", "value": "Point (0.584, 0.452)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/efd970d18e79ea0c.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.625, 0.408) farther from viewer compared to point (0.102, 0.847)?" }, { "from": "gpt", "value": "No, (0.625, 0.408) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c42e8f1fe2a5e9ac.jpg", "conversations": [ { "from": "human", "value": "\nBetween orange plastic kayak at lower right and skinny barefoot at lower right, which one is positioned higher?" }, { "from": "gpt", "value": "orange plastic kayak at lower right is above." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bb284ea473dbef41.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of white cotton shirt at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.830, 0.472)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d92aad89275623a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy jungle at upper center is positioned to the right of dark brown fuzzy beard at center?" }, { "from": "gpt", "value": "Indeed, green leafy jungle at upper center is positioned on the right side of dark brown fuzzy beard at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85af1d4329876af4.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.954, 0.722)?" }, { "from": "gpt", "value": "black and white shirt at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73f454fdba0799cc.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of white matte shirt at center from camera?" }, { "from": "gpt", "value": "A distance of 1.18 meters exists between white matte shirt at center and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4eee9939fe6b26c.jpg", "conversations": [ { "from": "human", "value": "\nBetween gray asphalt path at center and green wooden bench at center, which one is positioned higher?" }, { "from": "gpt", "value": "green wooden bench at center is higher up." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07770330f46910e5.jpg", "conversations": [ { "from": "human", "value": "\nIs dark green matte coat at upper right closer to camera compared to matte black jacket at left?" }, { "from": "gpt", "value": "Yes, it is in front of matte black jacket at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0275742ec2735b06.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte boat at lower left taller than metallic silver boat at lower center?" }, { "from": "gpt", "value": "No, white matte boat at lower left is not taller than metallic silver boat at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/124c2b8fbf15b67f.jpg", "conversations": [ { "from": "human", "value": "\nIs light pink fabric scarf at center taller than yellow fabric jacket at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/54ecd3be07f11e16.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer taking a picture of the soldiers in formation. You notice the camouflage fabric us army uniform at left and the camouflage fabric patch at center. Which object should you focus on first if you want to capture both in sharp focus?" }, { "from": "gpt", "value": "The camouflage fabric us army uniform at left is closer to the viewer than the camouflage fabric patch at center. To capture both in sharp focus, you should focus on the camouflage fabric us army uniform at left first, as it is closer, and the depth of field may naturally include the farther object if focused properly." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/41e244cfc28e4cd8.jpg", "conversations": [ { "from": "human", "value": "\nYou are a gardener checking the growth of the plants in the garden. You see the green leafy plant at upper left and the green leafy plant at lower left. Which one is taller?" }, { "from": "gpt", "value": "The green leafy plant at upper left is taller than the green leafy plant at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/32c429e5c73ba775.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of brown leather jacket at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.442, 0.475)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/67f47fbc378da855.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between white satin dress at center and camera?" }, { "from": "gpt", "value": "white satin dress at center and camera are 37.66 inches apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f28178448aec1685.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of dark gray matte bird at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.695, 0.158)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8193f7554834b207.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.836, 0.208) and point (0.337, 0.352), which one is positioned behind?" }, { "from": "gpt", "value": "Point (0.337, 0.352)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d29d0431540589e3.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.623, 0.778) and camera." }, { "from": "gpt", "value": "Point (0.623, 0.778) is 16.07 feet away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2393a2a907c859f2.jpg", "conversations": [ { "from": "human", "value": "\nHow far is point (0.888, 0.263) from the camera?" }, { "from": "gpt", "value": "A distance of 6.50 meters exists between point (0.888, 0.263) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/079fc666e87850ef.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the dark blue suit at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.693, 0.534)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9cee2a741f7c79ea.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between green grass at center and camera?" }, { "from": "gpt", "value": "They are 3.60 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/09f28354abfa2d27.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.330, 0.864) and point (0.080, 0.358), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.080, 0.358) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/351d11f09f63aade.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance from brown leafless branches at lower left to dark green textured tree at center." }, { "from": "gpt", "value": "brown leafless branches at lower left and dark green textured tree at center are 36.39 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0c4a3b24e269d10f.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of green reflective water at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.505, 0.678)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc7e80c8e2ff7b83.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of concrete at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.804, 0.270)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29def1a07418b44f.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.903, 0.473) come closer to viewer compared to point (0.125, 0.008)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/24d95f587e695f2e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.496, 0.797)?" }, { "from": "gpt", "value": "green grassy at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea9c8751e29c31b6.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.258, 0.734) positioned in front of point (0.584, 0.039)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.584, 0.039)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a6e437ed5f14cda.jpg", "conversations": [ { "from": "human", "value": "\nYou are an airplane pilot flying over the mountainous area. You need to determine which object in the scene is bigger to navigate safely. According to the image, which one is larger between the rocky mountain range at center and the white fluffy cloud at center?" }, { "from": "gpt", "value": "The rocky mountain range at center is larger in size than the white fluffy cloud at center, so the rocky mountain range at center is the larger object." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1bd8b9b72fadb327.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, black metal grid at center or white textured vent at upper center, stands shorter?" }, { "from": "gpt", "value": "white textured vent at upper center is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fcb986197c6e3e0e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.284, 0.831)?" }, { "from": "gpt", "value": "dirt/gravel construction site at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f9f8de8136b5b91b.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the white shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.545, 0.591)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/895218891d637031.jpg", "conversations": [ { "from": "human", "value": "\nIs matte gray tortoise at left above leathery gray tortoise at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b8f574daa3baed3.jpg", "conversations": [ { "from": "human", "value": "\nIs striped fabric shirt at center in front of brown hair at center?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ae4cf5b8549ac27.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark wood door at center appear over white cotton shirt at lower center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bfede8771e4d9838.jpg", "conversations": [ { "from": "human", "value": "\nYou are navigating through the corridor and need to reach a specific location. There are two points marked in the scene, point 1 at coordinates point (0.812, 0.358) and point 2 at coordinates point (0.727, 0.456). Which point is closer to you as you stand in the corridor?" }, { "from": "gpt", "value": "Point (0.812, 0.358) is closer to the viewer than point (0.727, 0.456), so you are closer to point 1." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d7010480f64b9d1e.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of translucent rubber bands at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.831, 0.784)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7bb6094f8cd7e2ce.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer planning to capture a wide landscape shot of the desert scene. You want to ensure that both the white fluffy cloud at upper center and the green matte grassland at lower center are clearly visible in the frame. Given their sizes, which one might require more careful framing to ensure it doesn not get lost in the composition?" }, { "from": "gpt", "value": "The green matte grassland at lower center might require more careful framing since the white fluffy cloud at upper center is wider, making it potentially more dominant in the composition and less likely to be overlooked." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00fe972199aa4500.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between blue rubber boot at center and blue fabric life vest at center." }, { "from": "gpt", "value": "32.81 inches" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2bd11c2a0c3076f2.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the dark brown hair at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.604, 0.883)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1aae06efe13490d8.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of gray fabric at center in the image." }, { "from": "gpt", "value": "[(0.762, 0.864)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7c625a90ff14d11.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.490, 0.042) from camera?" }, { "from": "gpt", "value": "A distance of 4.37 meters exists between point (0.490, 0.042) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3bfbcc5e4d08eb75.jpg", "conversations": [ { "from": "human", "value": "\nWhere is autumn leaves at upper left located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.471, 0.447)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c9fb71bcf3115ee2.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.711, 0.662)?" }, { "from": "gpt", "value": "navy blue sweater at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2aa20165b049a5a2.jpg", "conversations": [ { "from": "human", "value": "\nYou are a zookeeper observing two giraffes in their enclosure. You notice the spotted fur at center and the brown rough rock at lower left. Which object is closer to you, the observer?" }, { "from": "gpt", "value": "The spotted fur at center is closer to you because it is in front of the brown rough rock at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/99e753a42da9b0c0.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a clear shot of both the teal glossy wig at center and the purple silky wig at center from the ground below. Which wig will appear larger in your photo?" }, { "from": "gpt", "value": "The teal glossy wig at center will appear larger in the photo because it is closer to the viewer than the purple silky wig at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/947603392c8cbea3.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if wooden signpost at center-right is smaller than black plastic arrow at upper right?" }, { "from": "gpt", "value": "Actually, wooden signpost at center-right might be larger than black plastic arrow at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be94a62a84720bfd.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.748, 0.419) positioned before point (0.608, 0.666)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b232f2267fa5d9a3.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if smokey gray cloud at upper center is positioned above green leafy tree at center?" }, { "from": "gpt", "value": "Indeed, smokey gray cloud at upper center is positioned over green leafy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73ede91c5aab6ab3.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of the coffee shop bar and want to hang a new decorative banner that is 2 meters tall. The banner needs to be placed above the entrance but must not block the neon purple sign at right. Given the height of the brick at center, can the banner be safely hung without covering the sign?" }, { "from": "gpt", "value": "The brick at center is much taller than the neon purple sign at right, so the banner can be safely hung above the entrance without covering the sign since the brick at center provides sufficient vertical space." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ac03022ad060f2b.jpg", "conversations": [ { "from": "human", "value": "\nDoes satin silver hatchback at lower left appear on the right side of white matte car at center?" }, { "from": "gpt", "value": "In fact, satin silver hatchback at lower left is to the left of white matte car at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5ccd254b683c4c3.jpg", "conversations": [ { "from": "human", "value": "\nYou are an antique collector examining the image. You need to place a protective cover over the white stoneware vase at center and the matte ceramic vase at left. Which vase should you cover first if you want to start from the left side of the image?" }, { "from": "gpt", "value": "You should cover the matte ceramic vase at left first because it is positioned to the left of the white stoneware vase at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0c0bd6929bde3c5.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of the community center and want to ask someone at the table for information. Which object should you approach first, the smooth plastic table at center or the colored paper sign at upper left?" }, { "from": "gpt", "value": "You should approach the smooth plastic table at center first because it is to the right of the colored paper sign at upper left, meaning it is closer to your position at the entrance." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/194fb4a3ef15fa16.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the white striped shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.441, 0.589)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c9a016aeac05774f.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.899, 0.058)?" }, { "from": "gpt", "value": "dark gray coat at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/63312c892eb9bd5e.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between concrete stairs at center and camera?" }, { "from": "gpt", "value": "concrete stairs at center is 12.51 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/441eeda9ae326ef4.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.911, 0.533) or (0.131, 0.527)?" }, { "from": "gpt", "value": "The point (0.911, 0.533) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9281b597d98f6aad.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, black matte shirt at center or white marble pillar at left?" }, { "from": "gpt", "value": "white marble pillar at left is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3aba9f960217ed6d.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of light beige jacket at lower right? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.821, 0.644)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea17633c7274a6d8.jpg", "conversations": [ { "from": "human", "value": "\nYou are a spectator at the marathon and want to locate the red jacket at center and white matte cap at upper center. Which object is higher up in the image?" }, { "from": "gpt", "value": "The white matte cap at upper center is higher up in the image than the red jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c6266590c45cf13.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.202, 0.773) behind point (0.041, 0.664)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dfaed33f9bdc2388.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the path and see the point marked at coordinates (0.897, 0.981). If you want to place a small bench there, how far do you need to walk to reach that point?" }, { "from": "gpt", "value": "The point at coordinates (0.897, 0.981) is 2.86 meters away from you, so you need to walk 2.86 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0aef1e43e2a020ee.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of knitted brown sweater at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.571, 0.713)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8251de67be692894.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at center is positioned above white cotton shorts at center?" }, { "from": "gpt", "value": "Incorrect, green leafy tree at center is not positioned above white cotton shorts at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e5900bfcd2732c10.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.511, 0.317) from camera?" }, { "from": "gpt", "value": "8.82 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a3bc8d890514f236.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.479, 0.522) and point (0.306, 0.527), which one is positioned in front?" }, { "from": "gpt", "value": "Positioned in front is point (0.479, 0.522)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07affc3b90123598.jpg", "conversations": [ { "from": "human", "value": "\nYou are a technician who needs to adjust the distance between the pixelated plastic screen at upper left and the dark gray sweater at lower right to exactly 3 meters for a presentation. Currently, the distance is 2.54 meters. What should you do?" }, { "from": "gpt", "value": "The pixelated plastic screen at upper left is currently 2.54 meters away from the dark gray sweater at lower right. To reach the desired 3 meters, you should move the pixelated plastic screen at upper left further away from the dark gray sweater at lower right by 0.46 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/330916238e40c02b.jpg", "conversations": [ { "from": "human", "value": "\nIs brown/wooden gazebo at center to the right of green leafy tree at upper center from the viewer's perspective?" }, { "from": "gpt", "value": "In fact, brown/wooden gazebo at center is to the left of green leafy tree at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f39926047bca753.jpg", "conversations": [ { "from": "human", "value": "\nYou are a safety inspector at the construction site. You need to ensure that the blue plastic website at center and the blue fabric construction worker at center are visible to each other for communication. Is there any obstruction between them?" }, { "from": "gpt", "value": "The blue plastic website at center is smaller than the blue fabric construction worker at center, so there is no obstruction between them. They can see each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab08ff1be0274e05.jpg", "conversations": [ { "from": "human", "value": "\nIs light blue shirt at center taller than smooth skin hand at lower right?" }, { "from": "gpt", "value": "Correct, light blue shirt at center is much taller as smooth skin hand at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d28dea4f25f000ba.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing a photo shoot and need to place a backdrop behind both the matte blue shirt at left and the matte white blouse at center. Since the backdrop must cover both subjects, which subject requires the backdrop to be placed further back to accommodate their size?" }, { "from": "gpt", "value": "The matte white blouse at center requires the backdrop to be placed further back because it is larger than the matte blue shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef6ebcb1b14d259e.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing a picnic and need to place two items in your backpack. You have the clear plastic container at upper center and the white plastic bag at upper center. The backpack has a narrow compartment that can only fit items spaced 6 inches apart. Can both items fit in the compartment without overlapping?" }, { "from": "gpt", "value": "The distance between the clear plastic container at upper center and the white plastic bag at upper center is 6.71 inches. Since the backpack compartment requires items to be spaced 6 inches apart, the 6.71 inches distance is sufficient, so both items can fit without overlapping." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3184422ac873cdbd.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the black polished horse at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.392, 0.469)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/13bc0aa50d1a536d.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the crowd at this evening gathering. You see the blue plaid shirt at left and the black knit sweater at center. Which one is positioned more to the left?" }, { "from": "gpt", "value": "The blue plaid shirt at left is positioned more to the left than the black knit sweater at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f9361ff1dc632c5.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a rustic stone planet at upper left. Pinpoint a point to the rustic stone planet at upper left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.303, 0.227)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a02e59e62c697cdc.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of matte orange shirt at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.246, 0.483)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/15e8688d2b614862.jpg", "conversations": [ { "from": "human", "value": "\nHow close is black matte snowboard at center from matte black ski at upper left?" }, { "from": "gpt", "value": "They are 8.57 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2d780dd521d2641.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the smooth bark tree at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.387, 0.467)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29d3dc26c25e6bf0.jpg", "conversations": [ { "from": "human", "value": "\nDoes green needle-like foliage at center have a smaller size compared to bronze statue at lower left?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ac53634385ba2ad6.jpg", "conversations": [ { "from": "human", "value": "\nDoes transparent matte helmet at center appear under black matte glasses at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1c01fbe444c574d.jpg", "conversations": [ { "from": "human", "value": "\nIs silver metallic laptop at center positioned before matte black hair at center?" }, { "from": "gpt", "value": "Yes, silver metallic laptop at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78c796517decde42.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the porch and want to place a bird feeder exactly at the center of the white corrugated metal roof at upper center. According to the coordinates provided, what are the exact coordinates where you should place it?" }, { "from": "gpt", "value": "The exact coordinates for placing the bird feeder at the center of the white corrugated metal roof at upper center are 0.178 in the x axis and 0.579 in the y axis." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0c82bd95c09844e2.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the dark brown glass tower at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.577, 0.567)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/211dc0a4f428b18a.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the edge of the tent where the poker game is happening. There are two points marked on the table surface. One is at coordinate point(0.552, 0.388) and the other is at point(0.712, 0.130). Which point is closer to you?" }, { "from": "gpt", "value": "Point(0.552, 0.388) is closer to you because it is further to the viewer than point(0.712, 0.130)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8f6654bff41bbf60.jpg", "conversations": [ { "from": "human", "value": "\nIs black glossy laptop at upper left in front of white fur cat at center?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d35e8e3bfb470082.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the transparent glass water at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.553, 0.759)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ad47306b172d9bf3.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy hedge at center in front of white marble statue at lower left?" }, { "from": "gpt", "value": "No, green leafy hedge at center is further to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1dbc801d72212a11.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.180, 0.495)?" }, { "from": "gpt", "value": "teal plastic sunglasses at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3f1dc51b3b710b29.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.457, 0.697) lie in front of point (0.093, 0.664)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/69afa85492ccf978.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the park and want to reach the point marked at coordinates (0.242, 0.192). How far is this point from your current position?" }, { "from": "gpt", "value": "The point marked at coordinates (0.242, 0.192) is 19.30 meters away from your current position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8eb94f4ba05d7a05.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.199, 0.653) less distant than point (0.369, 0.569)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b6252af7ea619924.jpg", "conversations": [ { "from": "human", "value": "\nDoes white frosted cake with colorful decorations at lower center lie behind white frosted cake at lower left?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60c498f726624014.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray fabric jacket at center lie behind navy blue fleece at center?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/554ed8b82805be50.jpg", "conversations": [ { "from": "human", "value": "\nPoint to black suit at center.Point to the black suit at center in the image." }, { "from": "gpt", "value": "[(0.444, 0.580)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8ec9a32c44fe29c6.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from point (0.152, 0.770) to camera." }, { "from": "gpt", "value": "Point (0.152, 0.770) and camera are 28.31 feet apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dbaf739b8672e16f.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the right, green grass at center or brown brick barn at right?" }, { "from": "gpt", "value": "Positioned to the right is brown brick barn at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b25cba9a18f63b7.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the green matte mountain at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.805, 0.714)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d70885a7f2f97d12.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white mesh hospital bed at center is positioned below brown skin at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4b6e81e7b099545c.jpg", "conversations": [ { "from": "human", "value": "\nDoes plush pink fur at left have a smaller size compared to velvet brown coat at upper right?" }, { "from": "gpt", "value": "Correct, plush pink fur at left occupies less space than velvet brown coat at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a77848e567f0c5ea.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.507, 0.241)?" }, { "from": "gpt", "value": "brown shiny hair at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/81b4b8eb85275465.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the protest scene described. You want to take a photo that includes both the point at coordinates point (0.567, 0.573) and point (0.799, 0.147). However, you notice that one of these points is closer to the camera than the other. Which point should you focus on first to ensure both are in focus?" }, { "from": "gpt", "value": "Point (0.567, 0.573) is in front of point (0.799, 0.147), so you should focus on point (0.567, 0.573) first to ensure both are in focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf36b6876c7321f9.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the brick steeple at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.899, 0.644)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/54ce80a94a568291.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing in the park. You want to take a photo that includes both the plaid fabric shirt at center and the matte blue sweater at center. The camera you are using has a focal length that can capture objects up to 1.5 meters apart. Can you capture both items in a single shot without moving the camera?" }, { "from": "gpt", "value": "The distance between the plaid fabric shirt at center and the matte blue sweater at center is 1.71 meters. Since the camera can only capture objects up to 1.5 meters apart, you cannot capture both items in a single shot without moving the camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c40a44c796d30b57.jpg", "conversations": [ { "from": "human", "value": "\nYou are a physical therapist observing a patient using crutches. You notice two points marked on the image at coordinates point (0.498, 0.588) and point (0.734, 0.239). Which point is positioned closer to your viewpoint?" }, { "from": "gpt", "value": "Point (0.498, 0.588) is closer to the viewer than point (0.734, 0.239)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3267a6088cdcf3dd.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the scene and want to take a photo of the blue fabric kite at center and the red matte kite at center. Which kite should you focus on first to ensure both are in focus?" }, { "from": "gpt", "value": "You should focus on the blue fabric kite at center first because it is closer to you than the red matte kite at center, so adjusting focus from near to far will help both be in focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f7844f382087927.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.394, 0.872) and point (0.428, 0.723), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.394, 0.872)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e593d37a6bad7e9e.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.492, 0.933) or (0.992, 0.683)?" }, { "from": "gpt", "value": "Point (0.492, 0.933)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3fe1e8a2c02af758.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black glass at center is shorter than green matte boat at upper left?" }, { "from": "gpt", "value": "Correct, black glass at center is not as tall as green matte boat at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b03ed83a57b25d37.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown suede jacket at center have a lesser height compared to silver metallic mouse at lower right?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe6a5ed8ec7c6d63.jpg", "conversations": [ { "from": "human", "value": "\nDescribe the object at (0.219, 0.845)." }, { "from": "gpt", "value": "dark green leafy tree at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/38c786fe0ce393bc.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the barrel and want to place a small flag at two specific points on the barrel. The first point is at coordinates point (0.025, 0.503) and the second point is at point (0.283, 0.156). Which point will require you to reach further back to place the flag?" }, { "from": "gpt", "value": "Point (0.283, 0.156) will require reaching further back because it is farther from the viewer compared to point (0.025, 0.503)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce35d61f768568cf.jpg", "conversations": [ { "from": "human", "value": "\nYou are a maintenance worker needing to reach both the brown wood siding at upper left and the white plastic clock at center. If your ladder can extend up to 20 feet, will you need to move it between the two?" }, { "from": "gpt", "value": "The distance between the brown wood siding at upper left and the white plastic clock at center is 22.16 feet, which is greater than the ladder extension of 20 feet. Therefore, you will need to move the ladder between the two." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05ae31ebac92a732.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.458, 0.914) or point (0.889, 0.561)?" }, { "from": "gpt", "value": "Point (0.889, 0.561)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92e01bad2ac831e4.jpg", "conversations": [ { "from": "human", "value": "\nIs black leather jacket at center positioned in front of light brown fabric jacket at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec0b94b83664f78f.jpg", "conversations": [ { "from": "human", "value": "\nBetween metallic gray garage door at right and printed fabric shirt at center, which one has less height?" }, { "from": "gpt", "value": "Standing shorter between the two is printed fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d7481a13ffca5083.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.302, 0.758)?" }, { "from": "gpt", "value": "high visibility reflective jacket at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/63b74f01a0924127.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of natural wood table at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.527, 0.328)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/26353c9a201a10e0.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of blue fabric mask at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.442, 0.341)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/880ee7d5ce6ebab5.jpg", "conversations": [ { "from": "human", "value": "\nIs gray fuzzy scarf at center to the right of blue reflective plastic goggles at center from the viewer's perspective?" }, { "from": "gpt", "value": "Incorrect, gray fuzzy scarf at center is not on the right side of blue reflective plastic goggles at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b847f99a1b942742.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.705, 0.653) or (0.768, 0.497)?" }, { "from": "gpt", "value": "Point (0.705, 0.653)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/67fab21f9bcac365.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.455, 0.739)?" }, { "from": "gpt", "value": "white glossy rail at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/94330447936808cc.jpg", "conversations": [ { "from": "human", "value": "\nIs blue plaid shirt at center in front of matte wood frame at upper center?" }, { "from": "gpt", "value": "Yes, blue plaid shirt at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/616f8573f3a1e97e.jpg", "conversations": [ { "from": "human", "value": "\nYou are a construction worker standing near the excavation. You need to hand a tool to your colleague wearing the blue cotton shirt at upper center. The tool you have is 12 feet long. Can you reach them without moving closer? Please explain your reasoning." }, { "from": "gpt", "value": "The blue cotton shirt at upper center is 11.58 feet from the camera. Since the tool is 12 feet long, which is slightly longer than the distance between you and your colleague, you can reach them without moving closer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/759297feabaf0031.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.190, 0.973) and point (0.053, 0.986), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.190, 0.973) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85006ae56cdf0490.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.493, 0.745)?" }, { "from": "gpt", "value": "matte red jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/089e7eb666ad3d5c.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the wedding and need to capture a shot of the matte blue scarf at lower right and the matte black suit at center. Which object is located to the right of the other?" }, { "from": "gpt", "value": "The matte blue scarf at lower right is positioned on the right side of the matte black suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/657239fea8b18c6c.jpg", "conversations": [ { "from": "human", "value": "\nWhere is rusty metal fire escape at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.550, 0.688)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2814e4895226c639.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the clear glass water at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.944, 0.297)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f52e0a491cd83d9c.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the brown speckled sparrow at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.669, 0.605)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00d34f52ddbc35d5.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer who needs to adjust the lighting to ensure both the green jersey at center and the matte red blazer at center are equally visible. Considering their sizes, which one might require more focused lighting adjustments?" }, { "from": "gpt", "value": "The green jersey at center is bigger than the matte red blazer at center. Since the green jersey is larger, it might require more focused lighting adjustments to ensure it doesn" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3936211d03c43727.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown matte speaker at left lie in front of white plastic laptop at center?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd0679652e157097.jpg", "conversations": [ { "from": "human", "value": "\nLocate the patterned fabric shawl at center in the image." }, { "from": "gpt", "value": "[(0.626, 0.548)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/845c0d4909a64219.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of matte black shirt at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.382, 0.622)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4fbf05c2d31cacf2.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between dark gray jeans at lower right and camera." }, { "from": "gpt", "value": "dark gray jeans at lower right is 23.99 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44ad7c4047d4c720.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.318, 0.570)?" }, { "from": "gpt", "value": "matte blue shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37c3103ebf9d2cd4.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.605, 0.556) or (0.602, 0.545)?" }, { "from": "gpt", "value": "Point (0.602, 0.545)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c8f7b4881845bb0.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of green matte plants at left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.227, 0.433)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/922d8124ada09da7.jpg", "conversations": [ { "from": "human", "value": "\nBetween smooth brown hair at upper center and shiny dark hair at center, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "Positioned to the left is shiny dark hair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8cedd9996dc278ac.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.041, 0.633) positioned in front of point (0.634, 0.772)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0a86ed2c1922c1c.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte coat at left to the right of dark gray sweater at center from the viewer's perspective?" }, { "from": "gpt", "value": "In fact, black matte coat at left is to the left of dark gray sweater at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c8646b6755c01a9.jpg", "conversations": [ { "from": "human", "value": "\nDoes snow-covered pine at center have a lesser width compared to green matte evergreen tree at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5051ff8986ff3f35.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the garden and want to take a photo of both the modern art installation and the person taking a photo. The modern art installation is at point (0.971, 0.852) and the person is at point (0.268, 0.481). Since you want to include both in your frame, which point should you focus on first to ensure both are in focus?" }, { "from": "gpt", "value": "You should focus on point (0.268, 0.481) first because it is closer to you than point (0.971, 0.852), which is further away. By focusing on the closer point, you can ensure that both points are within the depth of field." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f6e29d2389d4430.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the white feathered bird at center. You notice the green reflective water at center is in the way. Can you adjust your position to focus on the bird without the water obstructing the view?" }, { "from": "gpt", "value": "The green reflective water at center is closer to the viewer than the white feathered bird at center. To focus on the bird without the water obstructing the view, you should move your position to either side so that the bird is no longer behind the water." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b85d001f6895de57.jpg", "conversations": [ { "from": "human", "value": "\nWhere is black fabric hat at upper center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.410, 0.152)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0121c5c2ed0a73a0.jpg", "conversations": [ { "from": "human", "value": "\nYou are an interior designer observing the traditional Indian ritual scene. You notice the white dotted fabric at lower right and the orange matte at lower right. Which object is positioned higher in the image?" }, { "from": "gpt", "value": "The white dotted fabric at lower right is above the orange matte at lower right, so it is positioned higher in the image." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/09a2e4ca8c594916.jpg", "conversations": [ { "from": "human", "value": "\nYou are an artist trying to hang a matte black rectangle at center on a wall. The wall has a white paper notepad at lower right already pinned there. How far apart are these two items?" }, { "from": "gpt", "value": "The white paper notepad at lower right is 18.83 centimeters from the matte black rectangle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e401ebb6de52b0a1.jpg", "conversations": [ { "from": "human", "value": "\nIs white plastic keyboard at center taller than beige plastic keyboard at lower center?" }, { "from": "gpt", "value": "Correct, white plastic keyboard at center is much taller as beige plastic keyboard at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/da5327c690ac8c99.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker looking at the trail ahead. You notice two backpacks on the ground at the lower left of your view. Which backpack is positioned more to the right between the camouflage fabric backpack at lower left and the purple fabric backpack at lower left?" }, { "from": "gpt", "value": "The camouflage fabric backpack at lower left is positioned more to the right compared to the purple fabric backpack at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e9659b0e78a0469.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person with a large package that requires a 2.5 meter wide doorway. Are the smooth glass doors at center wide enough for your package?" }, { "from": "gpt", "value": "The smooth glass doors at center are 24.46 meters apart, which is much wider than the required 2.5 meters. The package can easily pass through." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/821fa64a2ea426a2.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte fish at center have a lesser width compared to metal corrugated roof at center?" }, { "from": "gpt", "value": "Indeed, white matte fish at center has a lesser width compared to metal corrugated roof at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ebd70e309a4c2f90.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy palm tree at center to the right of illuminated gold christmas tree at center from the viewer's perspective?" }, { "from": "gpt", "value": "In fact, green leafy palm tree at center is to the left of illuminated gold christmas tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4bbd973419e2023f.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the base of the matte black stair at right and want to reach the transparent glass window at center. How far do you need to walk to get there?" }, { "from": "gpt", "value": "The distance between the matte black stair at right and the transparent glass window at center is 6.13 feet, so you need to walk 6.13 feet to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0001a646b2a73e94.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the red painted concrete amphitheater at lower left without any obstructions. What should you do to ensure the green leafy tree at upper center does not block your view?" }, { "from": "gpt", "value": "Move to a position where the green leafy tree at upper center is behind the red painted concrete amphitheater at lower left, as the tree is currently in front of the amphitheater." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d92a6a2188aca86.jpg", "conversations": [ { "from": "human", "value": "\nBetween black matte shirt at right and dark hair at center, which one is positioned higher?" }, { "from": "gpt", "value": "dark hair at center is above." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/83e16d0b5754b270.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any white textured radiator at lower left in the image." }, { "from": "gpt", "value": "[(0.151, 0.891)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/75bc9f5a1d5b4845.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of white paper at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.377, 0.134)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00be34d33ad4acc1.jpg", "conversations": [ { "from": "human", "value": "\nBetween green leafy tree at left and green painted wood park bench at lower center, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "Positioned to the right is green painted wood park bench at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9af9bc6bba1393e8.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the motorsport event and want to capture a photo that includes both the green grass at lower left and the plaid fabric shirt at upper center. Which object should you focus on first to ensure both are in frame?" }, { "from": "gpt", "value": "You should focus on the plaid fabric shirt at upper center first because the green grass at lower left is below it, so adjusting the camera angle to include the upper object will naturally include the lower one as well." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/54dbd0b572d04b4a.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of the historic stone structure and want to walk towards the white glossy light at center. Which direction should you move relative to the dark stone floor at center?" }, { "from": "gpt", "value": "You should move towards the dark stone floor at center because it is in front of the white glossy light at center, meaning the light is behind the floor from your current position at the entrance." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7f69442d1006e27a.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of matte brown beetle at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.479, 0.475)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb203027a5b2e927.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing a craft event and need to ensure there is enough space for participants. Given the blue fleece jacket at upper center and the wooden table at center, which object takes up more space in the scene?" }, { "from": "gpt", "value": "The wooden table at center takes up more space than the blue fleece jacket at upper center because the blue fleece jacket at upper center has a smaller size compared to wooden table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82ab9b0b9d600900.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of the house and want to reach the point marked at coordinates point (0.811, 0.752). If your maximum reach is 7 meters, can you comfortably extend your arm to touch that point?" }, { "from": "gpt", "value": "The distance of point (0.811, 0.752) from viewer is 6.96 meters, so yes, you can comfortably extend your arm to touch that point since it is within your 7 meters reach." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c981b8e53745a380.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to black puffy jacket at center? Please provide its 2D coordinates.Where can I find black puffy jacket at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.109, 0.722)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef7d493b78021e77.jpg", "conversations": [ { "from": "human", "value": "\nYou are an event planner arranging a photoshoot in this room. You need to decide which object, the blonde hair at upper right or the floral fabric dress at center, would be more visible in a wide shot. Based on their sizes, which one should you focus on?" }, { "from": "gpt", "value": "The floral fabric dress at center is larger than the blonde hair at upper right, so focusing on the floral fabric dress at center would make it more visible in a wide shot." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f4829cb91639f707.jpg", "conversations": [ { "from": "human", "value": "\nWhere is polka dot fabric dress at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.687, 0.384)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c3e243584efe64f.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in a forest and see the smooth bark tree at lower right. If you want to take a photo of it with your camera, which has a maximum focus range of 20 meters, will you be able to capture it clearly?" }, { "from": "gpt", "value": "The smooth bark tree at lower right is 21.96 meters away from camera, which exceeds the maximum focus range of 20 meters. Therefore, the camera cannot capture it clearly." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/72faa027c9080dc7.jpg", "conversations": [ { "from": "human", "value": "\nHow far apart are brown shiny hair at right and translucent plastic glasses at center?" }, { "from": "gpt", "value": "brown shiny hair at right is 24.06 inches from translucent plastic glasses at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e26073739bfd8fb3.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark gray fleece at center have a greater height compared to blondehair at right?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be1ee721b6cd94da.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, black fabric dodgers shirt at center or white fabric hat at upper right?" }, { "from": "gpt", "value": "Positioned to the left is black fabric dodgers shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/51a60b8b636b7e56.jpg", "conversations": [ { "from": "human", "value": "\nDoes red floral tank top at center have a smaller size compared to metallic black bench at center?" }, { "from": "gpt", "value": "No, red floral tank top at center is not smaller than metallic black bench at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/35fb26e63eebbb92.jpg", "conversations": [ { "from": "human", "value": "\nDoes white silk dhoti at center have a larger size compared to white silk cloth at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c0e230b91efd059.jpg", "conversations": [ { "from": "human", "value": "\nIs velvet red jacket at center positioned at the back of dark red sweater at center?" }, { "from": "gpt", "value": "No, velvet red jacket at center is in front of dark red sweater at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0d8720231c6d940.jpg", "conversations": [ { "from": "human", "value": "\nYou are a soccer referee observing the match. You notice the matte orange jersey at left and the black and red jersey at center. Which player is positioned higher on the field?" }, { "from": "gpt", "value": "The matte orange jersey at left is positioned higher on the field because it is above the black and red jersey at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/40948d9b18329ea5.jpg", "conversations": [ { "from": "human", "value": "\nIs pink fabric jacket at left to the left of white paper at center from the viewer's perspective?" }, { "from": "gpt", "value": "Yes, pink fabric jacket at left is to the left of white paper at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b32591064b6aae94.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.128, 0.855) or (0.375, 0.466)?" }, { "from": "gpt", "value": "The point (0.375, 0.466) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/45a7b25b082b53c5.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the center of the scene and see the point marked at coordinates (0.281, 0.772). What object is located at that point?" }, { "from": "gpt", "value": "The point at coordinates (0.281, 0.772) marks the white matte jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a0ca01813a12f04.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the green grass at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.775, 0.672)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b291f69ab144b25.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.059, 0.817) or point (0.195, 0.588)?" }, { "from": "gpt", "value": "Point (0.195, 0.588) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/194fc09f9c8a85d6.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is green textured christmas tree at center from white t-shirt at left?" }, { "from": "gpt", "value": "The distance of green textured christmas tree at center from white t-shirt at left is 27.97 inches." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8f1019eae140f2e.jpg", "conversations": [ { "from": "human", "value": "\nIs white frosty tree at upper right to the left of white matte ski at center from the viewer's perspective?" }, { "from": "gpt", "value": "Incorrect, white frosty tree at upper right is not on the left side of white matte ski at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/35ec52c9abeb26e0.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.853, 0.195) or point (0.309, 0.448)?" }, { "from": "gpt", "value": "The point (0.309, 0.448) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/64a0a7d763449b9b.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown rocky cliff at right appear on the right side of plaid fabric shirt at right?" }, { "from": "gpt", "value": "No, brown rocky cliff at right is not to the right of plaid fabric shirt at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8affb3d49b47392f.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.178, 0.308)?" }, { "from": "gpt", "value": "matte black hand at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c7b01650188a890.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.874, 0.777)?" }, { "from": "gpt", "value": "gray concrete pavement at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b236b0d066f176d5.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between point (0.786, 0.514) and camera?" }, { "from": "gpt", "value": "Point (0.786, 0.514) and camera are 78.15 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e1c7122505773318.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between gray rock formation at center and camera?" }, { "from": "gpt", "value": "gray rock formation at center is 38.43 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d44755ef8031b5e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.113, 0.441)?" }, { "from": "gpt", "value": "matte black monitor at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b6b7a7f08946512.jpg", "conversations": [ { "from": "human", "value": "\nDoes velvet santa suit at center come behind knitted beige shawl at center?" }, { "from": "gpt", "value": "No, it is in front of knitted beige shawl at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9784ac0ac915ccc8.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between matte black blazer at upper left and camera." }, { "from": "gpt", "value": "A distance of 1.40 meters exists between matte black blazer at upper left and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be9cb4b3068c9d72.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the gold polished statue at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.532, 0.581)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05c9a26d98132d60.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at point point (0.375, 0.727) and want to take a photo of the gymnasts on the blue mat area. The camera you are using has a maximum focus range of 15 feet. Will the camera be able to focus on the gymnasts?" }, { "from": "gpt", "value": "The distance between point (0.375, 0.727) and the camera is 17.41 feet, which exceeds the camera maximum focus range of 15 feet. Therefore, the camera will not be able to focus on the gymnasts." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ee2b8ae2c0049c0.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from brushed metal shirt at center to camera." }, { "from": "gpt", "value": "brushed metal shirt at center is 7.72 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8febcf4f41f01b00.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, red checkered shirt at center or dark blue jersey at left?" }, { "from": "gpt", "value": "dark blue jersey at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e45917dbda715b16.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at upper right wider than green matte tree at lower center?" }, { "from": "gpt", "value": "Yes, green leafy tree at upper right is wider than green matte tree at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7200bdaeccf0789.jpg", "conversations": [ { "from": "human", "value": "\nBetween clear water at lower right and black matte person at lower right, which one has more height?" }, { "from": "gpt", "value": "clear water at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc0f43f96a477e80.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the film festival event. You need to capture a photo of both the smooth skin portrait at center and the dark gray suit at right. Based on their positions, which object should you focus on first to ensure both are in frame?" }, { "from": "gpt", "value": "The dark gray suit at right is behind the smooth skin portrait at center, so you should focus on the smooth skin portrait at center first to ensure both are in frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/53ca1811c4ff9cc5.jpg", "conversations": [ { "from": "human", "value": "\nHow far is white plush bear at center from camera?" }, { "from": "gpt", "value": "white plush bear at center is 9.60 inches away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0877c70fa7e97dff.jpg", "conversations": [ { "from": "human", "value": "\nIs green fabric vest at lower left wider than light purple fleece jacket at lower right?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08d2bf9067fd29c3.jpg", "conversations": [ { "from": "human", "value": "\nHow far is matte blue shirt at upper left from camera?" }, { "from": "gpt", "value": "matte blue shirt at upper left and camera are 5.56 feet apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a7d56512d61654a.jpg", "conversations": [ { "from": "human", "value": "\nIs black plastic sunglasses at upper right wider than clear plastic glasses at center?" }, { "from": "gpt", "value": "Incorrect, black plastic sunglasses at upper right's width does not surpass clear plastic glasses at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/908d29728ca3a105.jpg", "conversations": [ { "from": "human", "value": "\nYou are a soccer coach analyzing the field positions during a match. You notice the white smooth soccer player at center and the matte blue and red striped jersey at center. Which player is located closer to the ground?" }, { "from": "gpt", "value": "The white smooth soccer player at center is positioned under the matte blue and red striped jersey at center, so the white smooth soccer player at center is closer to the ground." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00b0f8f1b9b03936.jpg", "conversations": [ { "from": "human", "value": "\nYou are a soccer referee observing the field. You notice the white mesh netting at right and the green synthetic turf at center. Which object is positioned farther to the right side of the field?" }, { "from": "gpt", "value": "The white mesh netting at right is positioned farther to the right side of the field compared to the green synthetic turf at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/93e8525f36f9df70.jpg", "conversations": [ { "from": "human", "value": "\nDoes dry grass at center appear under green leafy tree at left?" }, { "from": "gpt", "value": "Actually, dry grass at center is above green leafy tree at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06e17eca90acd43d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark blue coat at right is positioned below pink matte flowers at center?" }, { "from": "gpt", "value": "No, dark blue coat at right is not below pink matte flowers at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70b1c097d3146856.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of a photo of a man sitting on a red couch with a laptop and a ginger cat nearby. The photo has a specific point labeled as point (0.294, 0.684). If you want to touch that point on the photo, how far would you need to reach?" }, { "from": "gpt", "value": "The distance between point (0.294, 0.684) and the viewer is 34.44 inches, so you would need to reach 34.44 inches to touch that point on the photo." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/117facd40ff77cd9.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green fuzzy fern at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.764, 0.847)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/879b0a84d2dd935c.jpg", "conversations": [ { "from": "human", "value": "\nHow close is brown fuzzy duckling at center from brown fuzzy duckling at right?" }, { "from": "gpt", "value": "brown fuzzy duckling at center is 85.85 centimeters away from brown fuzzy duckling at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9be23238fcd72d3.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of the canopy tent and want to greet both men wearing the white smooth dress shirt at right and the striped fabric shirt at center. Which man should you approach first if you want to greet the one closer to the entrance?" }, { "from": "gpt", "value": "The striped fabric shirt at center is closer to the entrance than the white smooth dress shirt at right, so you should approach the striped fabric shirt at center first." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/610583f2fd54b54d.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the transparent glass skyscraper at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.756, 0.252)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/520bec9e596d0eaf.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the camera position. You want to take a closeup shot of the knitted gray cardigan at center without moving the camera. Is it possible to do so with your current zoom level if your camera can zoom up to 2 meters?" }, { "from": "gpt", "value": "The knitted gray cardigan at center is 1.94 meters away from camera, so yes, you can take a closeup shot of the knitted gray cardigan at center without moving the camera since the distance is within the camera zoom range of 2 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0eea7c04a59cafc5.jpg", "conversations": [ { "from": "human", "value": "\nIs dark asphalt pavement at center above matte gray hoodie at center?" }, { "from": "gpt", "value": "Correct, dark asphalt pavement at center is located above matte gray hoodie at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36075cf8976f0faa.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the brown smooth smoked gouda at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.864, 0.653)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e61453f9229d80e7.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.869, 0.419) or (0.040, 0.959)?" }, { "from": "gpt", "value": "Point (0.869, 0.419) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/18e7b606ca1fe7eb.jpg", "conversations": [ { "from": "human", "value": "\nCould you measure the distance between brown leather jacket at lower center and light brown leather jacket at center?" }, { "from": "gpt", "value": "brown leather jacket at lower center and light brown leather jacket at center are 2.38 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4b1e49b19e4f8423.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.444, 0.639) farther from viewer compared to point (0.955, 0.559)?" }, { "from": "gpt", "value": "No, (0.444, 0.639) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c5a64b7effa5c87c.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the base of the green leafy tree at upper center and want to walk to the nearest wooden post supporting the grapevines in the foreground. How far would you have to walk?" }, { "from": "gpt", "value": "The distance between the green leafy tree at upper center and the nearest wooden post supporting the grapevines in the foreground is 61.04 meters, so you would have to walk 61.04 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aeb4903ce4eab107.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.429, 0.662) come in front of point (0.818, 0.605)?" }, { "from": "gpt", "value": "Yes, point (0.429, 0.662) is in front of point (0.818, 0.605)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/71abbfda00108334.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of black matte shirt at center in the image." }, { "from": "gpt", "value": "[(0.447, 0.762)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/608c9b106516c238.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery robot with a package that needs to be placed on the white plastic computer desk at center. You are currently positioned at the location of the striped sweater at center. Can you reach the desk without moving any objects?" }, { "from": "gpt", "value": "The distance between the striped sweater at center and the white plastic computer desk at center is 22.84 centimeters, so yes, the robot can reach the desk without moving any objects since the distance is manageable." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/562aee481844abd5.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.408, 0.261)?" }, { "from": "gpt", "value": "blue sweater at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ceb39637816d90d6.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position observing the sunset scene. There is a specific point marked at coordinates point (0.896, 0.800) in the image. How far is that point from you?" }, { "from": "gpt", "value": "The point (0.896, 0.800) is 11.75 meters away from the camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f09f312ee7a920ad.jpg", "conversations": [ { "from": "human", "value": "\nYou are a construction worker standing at the base of the white smooth water tower at upper right. You need to place a safety barrier around it. The barrier requires a minimum distance of 80 meters from the tower to ensure safety. Can you determine if the current distance between you and the tower meets the safety requirement?" }, { "from": "gpt", "value": "The white smooth water tower at upper right is 82.37 meters away from the viewer, which exceeds the minimum required distance of 80 meters. Therefore, the current distance meets the safety requirement and the barrier can be placed accordingly." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3995f7dc9681833a.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.229, 0.730)?" }, { "from": "gpt", "value": "white fluffy snow at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6a948fc8ef1dc748.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.557, 0.197) and point (0.769, 0.247), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.769, 0.247) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/878d520ede4abb9f.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.731, 0.450) and point (0.581, 0.595), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.731, 0.450) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc5dcfad9d884620.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the green leafy plants at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.505, 0.748)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01a3ef09d9eda6c5.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green grass at lower center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.478, 0.878)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9a2b5b148fd1dfb7.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of black matte helmet at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.948, 0.633)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ce2de546ceb8524.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark brown leather jacket at center is shorter than light brown cotton t-shirt at center?" }, { "from": "gpt", "value": "Yes, dark brown leather jacket at center is shorter than light brown cotton t-shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c8f2df0820e33c8c.jpg", "conversations": [ { "from": "human", "value": "\nLocate the matte blue shirt at left in the image." }, { "from": "gpt", "value": "[(0.235, 0.625)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a4b34e5fd2ab6e9.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing a photo shoot and need to decide which piece of clothing to feature first. Based on the image, which item is wider between the white floral dress at center and the brown beaded necklace at center?" }, { "from": "gpt", "value": "The white floral dress at center is wider than the brown beaded necklace at center according to the description." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b079f6b51541010f.jpg", "conversations": [ { "from": "human", "value": "\nYou are at a party and want to hand a drink to both the red cotton shirt at center and the pink fabric shirt at center. If you are standing at the edge of the dance floor, which person is farther away from you?" }, { "from": "gpt", "value": "The distance between the red cotton shirt at center and the pink fabric shirt at center is 6.74 feet. Since both are at the center of the scene, they are equidistant from your position at the edge of the dance floor. However, the exact distance from you to each would depend on your specific location, but their separation from each other is 6.74 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/80bab2a4c04f0e6a.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the satin black car at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.161, 0.430)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec79850570292b78.jpg", "conversations": [ { "from": "human", "value": "\nIs dark gray rock at center bigger than green leafy bush at center?" }, { "from": "gpt", "value": "Actually, dark gray rock at center might be smaller than green leafy bush at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b00f3490601a9fc.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, matte gray uniform at center or wooden table at center, stands shorter?" }, { "from": "gpt", "value": "Standing shorter between the two is wooden table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef6a990b541818f5.jpg", "conversations": [ { "from": "human", "value": "\nYou are a visitor approaching the USDA building and notice the beige glass building at center and the green grass at lower center. Which object is closer to your viewpoint as you approach the entrance?" }, { "from": "gpt", "value": "The beige glass building at center is closer to your viewpoint because the green grass at lower center is positioned behind it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/89353c1b69b41beb.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between transparent glass bottle at center and camera?" }, { "from": "gpt", "value": "transparent glass bottle at center and camera are 1.14 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/76411e74f1d16d8f.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.676, 0.439) positioned in front of point (0.732, 0.867)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/355500d60d34607a.jpg", "conversations": [ { "from": "human", "value": "\nCould you measure the distance between black matte jacket at center and black matte jacket at lower left?" }, { "from": "gpt", "value": "black matte jacket at center and black matte jacket at lower left are 4.00 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/87270c3c72aea308.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of gray fabric at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.721, 0.605)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1497076718049d7.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the two buildings and want to take a photo. You notice two points marked in the scene. Which point, point (0.284, 0.723) or point (0.097, 0.848), is closer to your camera lens?" }, { "from": "gpt", "value": "Point (0.284, 0.723) is further to the camera than point (0.097, 0.848), so the point closer to the camera lens is point (0.097, 0.848)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7f0ff4ccff87ea5b.jpg", "conversations": [ { "from": "human", "value": "\nDoes bare branches at center have a smaller size compared to black wrought iron fence at lower center?" }, { "from": "gpt", "value": "Incorrect, bare branches at center is not smaller in size than black wrought iron fence at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1319be798c5be4d.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the brown rough stone at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.508, 0.823)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/634b1f525d704f81.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.532, 0.566) farther from camera compared to point (0.526, 0.800)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fef9922d3303bfcd.jpg", "conversations": [ { "from": "human", "value": "\nYou are navigating a drone over a wooded area and need to land it precisely on the rubberized blue raft at upper center. According to the coordinates provided, what are the exact coordinates where you should direct the drone to land?" }, { "from": "gpt", "value": "The rubberized blue raft at upper center is located at point (0.572, 0.194), so you should direct the drone to land there." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ab7dd141db46a6e.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing in front of the bench. You want to take a photo of the matte black dress at left and the blue cotton shirt at center so that both are fully visible in the frame. Given their height difference, which clothing item should you adjust your camera angle to focus on to ensure both are in focus?" }, { "from": "gpt", "value": "The matte black dress at left is taller than the blue cotton shirt at center. To ensure both are in focus, you should adjust your camera angle to focus on the matte black dress at left since it is taller and requires the camera to capture a wider vertical space." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a553169c56946327.jpg", "conversations": [ { "from": "human", "value": "\nWhere is metallic silver fork at lower left located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.125, 0.902)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3db4457af88c4886.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between point (0.560, 0.856) and camera." }, { "from": "gpt", "value": "The distance of point (0.560, 0.856) from camera is 44.36 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b347fa584395e73.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.444, 0.502) come closer to viewer compared to point (0.931, 0.608)?" }, { "from": "gpt", "value": "Yes, point (0.444, 0.502) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/421a4bf9d3cd93c8.jpg", "conversations": [ { "from": "human", "value": "\nLocate white matte shirt at center in the image." }, { "from": "gpt", "value": "[(0.334, 0.566)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3970ff5ba2e44d41.jpg", "conversations": [ { "from": "human", "value": "\nIs blue denim shirt at left thinner than brown hair at upper right?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9232a00d15403f2d.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the edge of the waterway and want to place a small wooden sign between the green mossy bank at center and the green rough bark tree at upper left. Which object should you place the sign closer to if you want it to be more visible to someone approaching from the front?" }, { "from": "gpt", "value": "The green mossy bank at center is closer to the viewer than the green rough bark tree at upper left, so placing the sign closer to the green mossy bank at center would make it more visible to someone approaching from the front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/332a2833093d8cf8.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a blue matte charlie brown figure at center. Pinpoint a point to the blue matte charlie brown figure at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.739, 0.800)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/008a9370ee5a3bba.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black silk suit at center is positioned above blue striped tie at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/121fedf358e44ecd.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing a charity event and need to display two items from the image. The display area has a width limit of 1 meter. Given that the matte gray coat at center and the floral print scarf at center must both be displayed, will their combined width exceed the limit?" }, { "from": "gpt", "value": "The matte gray coat at center is wider than the floral print scarf at center. However, without specific measurements, it is impossible to determine if their combined width exceeds 1 meter. Additional information about each item is needed to make an accurate assessment." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9a9e9f7be2507fb.jpg", "conversations": [ { "from": "human", "value": "\nYou are an event coordinator planning to set up a photo booth in this space. You need to ensure that the camouflage pants at lower left and the light beige skin at upper center are both visible in the booth photos. Based on their positions, which object should be placed closer to the camera to ensure both are in focus?" }, { "from": "gpt", "value": "The camouflage pants at lower left should be placed closer to the camera because it is located below the light beige skin at upper center, so adjusting their distance can help both be in focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b395a38b70210e50.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.339, 0.542) or point (0.015, 0.806)?" }, { "from": "gpt", "value": "The point (0.015, 0.806) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea279bc6b8d0860e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if polished stone column at center is bigger than green leafy hedge at left?" }, { "from": "gpt", "value": "Actually, polished stone column at center might be smaller than green leafy hedge at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78cbafd33783f939.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.645, 0.478) or point (0.718, 0.895)?" }, { "from": "gpt", "value": "Point (0.645, 0.478)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef2b19848863a1d9.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.066, 0.627) or (0.463, 0.727)?" }, { "from": "gpt", "value": "The point (0.066, 0.627) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/19b0587842aa9870.jpg", "conversations": [ { "from": "human", "value": "\nBetween shiny black car at center and glossy black car at center, which one is positioned higher?" }, { "from": "gpt", "value": "glossy black car at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8752ff5ff654cfac.jpg", "conversations": [ { "from": "human", "value": "\nBetween green leafy shrub at center and brown rough rock at center, which one is positioned lower?" }, { "from": "gpt", "value": "brown rough rock at center is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cba127f8f5c51d2f.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the black chalkboard at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.742, 0.672)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5492fe1ee1987c20.jpg", "conversations": [ { "from": "human", "value": "\nDoes denim pants at lower center have a smaller size compared to light blue fabric pants at lower center?" }, { "from": "gpt", "value": "Actually, denim pants at lower center might be larger than light blue fabric pants at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/10a94f4109b95a1d.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the wooden at lower center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.565, 0.805)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/63f61fa5370aab89.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of pink fabric shirt at lower left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.367, 0.784)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6903f311609bf9f9.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.848, 0.562) more distant than point (0.673, 0.397)?" }, { "from": "gpt", "value": "No, (0.848, 0.562) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7abf38c685a89733.jpg", "conversations": [ { "from": "human", "value": "\nPoint to white matte golf club at center.Point to the white matte golf club at center in the image." }, { "from": "gpt", "value": "[(0.218, 0.295)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ba46169f5c3d706.jpg", "conversations": [ { "from": "human", "value": "\nIs leather boot at lower left below white soft fur paw at lower left?" }, { "from": "gpt", "value": "Yes, leather boot at lower left is below white soft fur paw at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b957054477ce4aa0.jpg", "conversations": [ { "from": "human", "value": "\nIs black and white striped shirt at center shorter than matte black sunglasses at center?" }, { "from": "gpt", "value": "Incorrect, black and white striped shirt at center's height does not fall short of matte black sunglasses at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07c8c6936f703a47.jpg", "conversations": [ { "from": "human", "value": "\nBetween matte black tablet at center and matte red shirt at center, which one is positioned higher?" }, { "from": "gpt", "value": "matte black tablet at center is above." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/673939b81117416c.jpg", "conversations": [ { "from": "human", "value": "\nYou are a fashion designer analyzing the positioning of accessories in a professional setting. You notice the floral silk tie at center. Can you determine its exact coordinates in the image?" }, { "from": "gpt", "value": "The floral silk tie at center is positioned at coordinates point (0.436, 0.509)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4593605ba2f9cef6.jpg", "conversations": [ { "from": "human", "value": "\nIs red fabric kimono at left above dark gray suit at center?" }, { "from": "gpt", "value": "No, red fabric kimono at left is not above dark gray suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b8073190badb7ae4.jpg", "conversations": [ { "from": "human", "value": "\nBased on the scene description, which object is taller between the white cotton shirt at center and the green matte shirt at right?" }, { "from": "gpt", "value": "The white cotton shirt at center is much taller than the green matte shirt at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d98887816617c33.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between point (0.325, 0.603) and camera." }, { "from": "gpt", "value": "Point (0.325, 0.603) and camera are 35.25 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0621ee1c9823002a.jpg", "conversations": [ { "from": "human", "value": "\nHow far apart are red brick clock tower at center and brick red clock tower at center?" }, { "from": "gpt", "value": "They are 61.31 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37150909193d1c6a.jpg", "conversations": [ { "from": "human", "value": "\nYou are a maintenance worker standing at the camera position. You need to retrieve the matte blue barrel at center left. Can you reach it without moving from your current position?" }, { "from": "gpt", "value": "The matte blue barrel at center left is 46.17 feet away from camera, so you cannot reach it without moving from your current position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd0e2936909f0712.jpg", "conversations": [ { "from": "human", "value": "\nHow close is white plastic podium at center from red dotted fabric tie at center?" }, { "from": "gpt", "value": "The distance of white plastic podium at center from red dotted fabric tie at center is 13.51 inches." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c1bb008268c2659d.jpg", "conversations": [ { "from": "human", "value": "\nLocate all transparent glass car window at upper center in the image." }, { "from": "gpt", "value": "[(0.620, 0.253)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/def7c91353ec60df.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of matte black guitar at center in the image." }, { "from": "gpt", "value": "[(0.397, 0.523)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e3595ec33dea5988.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.866, 0.400) or (0.487, 0.406)?" }, { "from": "gpt", "value": "The point (0.487, 0.406) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f4724a80073bfa8.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between gray fleece sweatshirt at center and matte black blazer at center." }, { "from": "gpt", "value": "gray fleece sweatshirt at center is 1.03 meters from matte black blazer at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/daf7708cea5c8a3d.jpg", "conversations": [ { "from": "human", "value": "\nIs white glossy round table at center to the left of wooden bookshelf at left from the viewer's perspective?" }, { "from": "gpt", "value": "In fact, white glossy round table at center is to the right of wooden bookshelf at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/452a3682d320d7a9.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny red coat at center to the right of matte black jacket at left from the viewer's perspective?" }, { "from": "gpt", "value": "Indeed, shiny red coat at center is positioned on the right side of matte black jacket at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/35a1eb0c3dbba882.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.362, 0.739) or (0.679, 0.348)?" }, { "from": "gpt", "value": "The point (0.679, 0.348) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/946abb40d8ae6fcc.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.469, 0.450) positioned behind point (0.188, 0.467)?" }, { "from": "gpt", "value": "No, (0.469, 0.450) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7422215105a33986.jpg", "conversations": [ { "from": "human", "value": "\nHow far is brown stone tower at center from camera?" }, { "from": "gpt", "value": "brown stone tower at center and camera are 34.57 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0f82d50e14f9942.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and want to reach the point marked at coordinates (0.149, 0.683). How far do you need to walk to get there?" }, { "from": "gpt", "value": "The point marked at coordinates (0.149, 0.683) is 6.25 meters away from the camera, so you need to walk 6.25 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e7ca3498894582d.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.137, 0.344) come farther from viewer compared to point (0.747, 0.670)?" }, { "from": "gpt", "value": "Yes, point (0.137, 0.344) is farther from viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/90e1346f74e75434.jpg", "conversations": [ { "from": "human", "value": "\nIs bronze statue at center smaller than light brown wooden bench at center?" }, { "from": "gpt", "value": "Indeed, bronze statue at center has a smaller size compared to light brown wooden bench at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f3dad26e58e17726.jpg", "conversations": [ { "from": "human", "value": "\nBetween gray gravel at center and metallic silver motorcycle at center, which one has less height?" }, { "from": "gpt", "value": "With less height is gray gravel at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fdc36b304c0d5953.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.463, 0.283) lie in front of point (0.263, 0.755)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/61acbae188b95734.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if denim jeans at lower left is shorter than black matte hair at lower right?" }, { "from": "gpt", "value": "No, denim jeans at lower left is not shorter than black matte hair at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/abb178bf88c37bd9.jpg", "conversations": [ { "from": "human", "value": "\nBetween matte yellow dress at center and light blue fabric dress at lower right, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "From the viewer's perspective, light blue fabric dress at lower right appears more on the right side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1440d1d1282403ce.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the crab preparation area and need to pick up an object. Which of the two points, point (0.917, 0.031) or point (0.838, 0.077), is closer to you?" }, { "from": "gpt", "value": "Point (0.917, 0.031) is closer to the camera than point (0.838, 0.077), so it is closer to you." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c068513b7a88706.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the edge of the field. You want to take a photo that includes both the red matte jersey at center and the black smooth shirt at center. Which one will appear larger in the photo?" }, { "from": "gpt", "value": "The red matte jersey at center will appear larger in the photo because it is closer to the viewer than the black smooth shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8905f82911371c12.jpg", "conversations": [ { "from": "human", "value": "\nYou are a pedestrian standing at the center of the street facing the building. You see a shiny black car at lower right and a metallic silver car at lower left. Which car is closer to your right side?" }, { "from": "gpt", "value": "The shiny black car at lower right is closer to your right side because it is positioned to the right of the metallic silver car at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8769d4964817fd23.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the striped cotton shirt at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.547, 0.609)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4dde91b10a612c20.jpg", "conversations": [ { "from": "human", "value": "\nYou are a tourist standing in front of the Torre de Belm and want to take a photo that includes both the stone tower at center and the reflective silver water at lower center. Based on their positions, which object should appear closer to the camera in your photo?" }, { "from": "gpt", "value": "The stone tower at center is further to the viewer than reflective silver water at lower center, so the stone tower at center will appear closer to the camera in the photo." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f480aa97152205d2.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of white concrete pavement at center in the image." }, { "from": "gpt", "value": "[(0.421, 0.780)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3af95f8dceaedabd.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, white frosted glass at upper left or light green fabric at upper right?" }, { "from": "gpt", "value": "Positioned lower is light green fabric at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/008dbf80243141f6.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.785, 0.441) positioned before point (0.320, 0.261)?" }, { "from": "gpt", "value": "No, (0.785, 0.441) is behind (0.320, 0.261)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c82bb94e6cab21bb.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the celebratory scene. The scene has a point marked at coordinates point (0.671, 0.561). Can you describe what is located at that point?" }, { "from": "gpt", "value": "The point (0.671, 0.561) indicates the location of the matte red shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bb14e32456a1bb72.jpg", "conversations": [ { "from": "human", "value": "\nIs dark brown leather jacket at center to the right of blue cotton shirt at center from the viewer's perspective?" }, { "from": "gpt", "value": "Indeed, dark brown leather jacket at center is positioned on the right side of blue cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/859e8cb2f60806f7.jpg", "conversations": [ { "from": "human", "value": "\nIs clear water at center smaller than blue fabric kayak at center?" }, { "from": "gpt", "value": "Actually, clear water at center might be larger than blue fabric kayak at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/885aa3dd88a4d027.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the banner and the jacket in the scene. Given that the white paper banner at center is narrower than the dark brown leather jacket at center, which object would you need to position closer to the camera to ensure both fill the frame equally?" }, { "from": "gpt", "value": "Since the white paper banner at center is narrower than the dark brown leather jacket at center, you would need to position the white paper banner at center closer to the camera to ensure both fill the frame equally." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b6456e0f025a2be.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between gray striped blouse at center and camera." }, { "from": "gpt", "value": "1.12 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7d6e185aaebbe031.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black netting at upper right appear over matte black face at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d722fe6ff47b616b.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a pink fabric at center. Pinpoint a point to the pink fabric at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.431, 0.895)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/038c0e49c3c925cd.jpg", "conversations": [ { "from": "human", "value": "\nDoes green matte christmas tree at center appear over white cotton shirt at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/17c6a35c83f2812e.jpg", "conversations": [ { "from": "human", "value": "\nIs floral bouquet at center to the right of smooth plastic vase at center from the viewer's perspective?" }, { "from": "gpt", "value": "In fact, floral bouquet at center is to the left of smooth plastic vase at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8eca7ebd3354fd85.jpg", "conversations": [ { "from": "human", "value": "\nDoes yellow matte jacket at center have a lesser height compared to white earphone at left?" }, { "from": "gpt", "value": "No, yellow matte jacket at center is not shorter than white earphone at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d40135c2268fd2a9.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black jacket at left have a lesser height compared to dark gray suit at center?" }, { "from": "gpt", "value": "Indeed, matte black jacket at left has a lesser height compared to dark gray suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7ffc723443a935e.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the glossy glass tower at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.579, 0.577)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37f67733fa4a861a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at upper right is taller than brown wooden table at center?" }, { "from": "gpt", "value": "Correct, green leafy tree at upper right is much taller as brown wooden table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0adccb1296a9bda0.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, brown matte t-shirt at center or black matte shirt at center?" }, { "from": "gpt", "value": "Positioned to the left is brown matte t-shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5dc40f24ba2894cc.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.429, 0.642) or point (0.633, 0.914)?" }, { "from": "gpt", "value": "The point (0.429, 0.642) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a006176b716b98c5.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray water at lower left is positioned to the right of yellow wood beach hut at center?" }, { "from": "gpt", "value": "In fact, gray water at lower left is to the left of yellow wood beach hut at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c2e1cffc4009ab1a.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.370, 0.547) behind point (0.667, 0.505)?" }, { "from": "gpt", "value": "No, (0.370, 0.547) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06350cec9de44bea.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.128, 0.558) come behind point (0.369, 0.500)?" }, { "from": "gpt", "value": "No, it is in front of (0.369, 0.500)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c6fa4a3de52c06ed.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the reddish-brown leather jacket at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.401, 0.470)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/554b7ab0f3e1cce4.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to pink smooth eyebrow at upper center? Please provide its 2D coordinates.Where can I find pink smooth eyebrow at upper center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.658, 0.448)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ae4a8d91ecec639.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any green matte coconuts at upper right in the image." }, { "from": "gpt", "value": "[(0.742, 0.514)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/14cd7e43e76451cb.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the plaid fabric shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.621, 0.714)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7a5c4c2502782fa9.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of yellow matte tray at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.408, 0.533)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d4350f51c238ff3.jpg", "conversations": [ { "from": "human", "value": "\nPoint to white glossy sports car at left.Point to the white glossy sports car at left in the image." }, { "from": "gpt", "value": "[(0.309, 0.597)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34145b6140aa0487.jpg", "conversations": [ { "from": "human", "value": "\nIs pink fabric dress at left in front of velvet dark blue rocking chair at right?" }, { "from": "gpt", "value": "Yes, it is in front of velvet dark blue rocking chair at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed6ef440c9bb3650.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if smooth dark wood dock at lower right is smaller than shiny silver boat at center?" }, { "from": "gpt", "value": "No, smooth dark wood dock at lower right is not smaller than shiny silver boat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/528d60e55fcf49b1.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the white cotton cap at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.732, 0.388)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00f106127d8321ca.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of white glossy bowl at lower right more distant than that of white glossy bowl at lower center?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/126d01c6b2c63e49.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of black fabric person at right?" }, { "from": "gpt", "value": "18.15 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7d03a4d5fbd38a1.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from point (0.666, 0.688) to camera." }, { "from": "gpt", "value": "Point (0.666, 0.688) and camera are 10.16 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d5dab1d3852319c.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.480, 0.100) positioned in front of point (0.922, 0.212)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed4796764c2d32d7.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.789, 0.942) and point (0.115, 0.491), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.789, 0.942) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b17a0f34f2541db.jpg", "conversations": [ { "from": "human", "value": "\nLocate all green matte shirt at left in the image." }, { "from": "gpt", "value": "[(0.184, 0.588)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04b3145dcb20095f.jpg", "conversations": [ { "from": "human", "value": "\nYou are a visitor approaching the building and see the smooth concrete at center and the dark blue fabric at lower left. Which object is positioned to the right side from your perspective?" }, { "from": "gpt", "value": "The smooth concrete at center is positioned to the right of the dark blue fabric at lower left, so the smooth concrete at center is on the right side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2696fd25d6766319.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, matte black neck at center or green fabric lanyard at center?" }, { "from": "gpt", "value": "green fabric lanyard at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/41661cd69108545c.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, glistening silver water at center or white glossy boat at center?" }, { "from": "gpt", "value": "Positioned to the right is white glossy boat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b59901c739016b81.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dry grass at center is taller than green leafy tree at center?" }, { "from": "gpt", "value": "Incorrect, dry grass at center's height is not larger of green leafy tree at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77b503cec1a1bc42.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue water at center lie behind yellow metallic crane at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4cdceb8e25508856.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of plaid fabric shirt at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.171, 0.698)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46411669299e5366.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the green leafy tree at upper left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.228, 0.073)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dcf4a4c1d90d2fcc.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the white marble statue at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.385, 0.231)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7721485f0b1e7b3a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray asphalt race track at center is bigger than sleek silver/silver metallic sports car at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b639f17d87401207.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the Museo del Agrarismo Mexicano and want to read the black leather plaque at center. How far do you need to walk to reach it?" }, { "from": "gpt", "value": "The black leather plaque at center is 3.92 meters away from the viewer, so you need to walk 3.92 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9ba572ac63cf704.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.875, 0.528) less distant than point (0.939, 0.500)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.939, 0.500)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1a137b95428fccc.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked by the coordinates (0.473, 0.791) in the image. What object are you directly in front of?" }, { "from": "gpt", "value": "The point (0.473, 0.791) corresponds to the green leafy tree at center, so you are directly in front of the green leafy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b291b7b4f2b8b843.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the brown dry grass at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.506, 0.684)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0de7c4521782a7a5.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black adidas tracksuit at center is positioned to the right of matte black tracksuit at center?" }, { "from": "gpt", "value": "Indeed, black adidas tracksuit at center is positioned on the right side of matte black tracksuit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd0b39b76dbd6179.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the rusty metal roof at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.136, 0.525)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/84bcf8c5427bca4d.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the striped fabric top at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.324, 0.683)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4d5a0171fa04ef09.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of pink matte building at center from camera?" }, { "from": "gpt", "value": "They are 102.19 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a756724a2a0902a5.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer positioned at the runway end. You need to capture a photo that includes both the black satin dress at center and the matte black dress at center. Given that your camera has a maximum focus range of 3 meters, will you be able to capture both dresses in focus?" }, { "from": "gpt", "value": "The black satin dress at center is 3.81 meters away from the matte black dress at center. Since the distance between them exceeds the camera maximum focus range of 3 meters, the camera cannot focus on both dresses simultaneously." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/30c761f7f096b82a.jpg", "conversations": [ { "from": "human", "value": "\nYou are a passenger in the backseat of the car and want to know which vehicle is taller between the blue matte car at right and the white matte sedan at center. Can you determine this based on the view from your seat?" }, { "from": "gpt", "value": "The blue matte car at right is taller than the white matte sedan at center according to the description." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/98bfe6b3a417677d.jpg", "conversations": [ { "from": "human", "value": "\nLocate all white satin dress at center in the image." }, { "from": "gpt", "value": "[(0.728, 0.681)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00cbaa47dea08fdb.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of concrete pavement at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.636, 0.867)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77c87a7b9408599e.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from point (0.576, 0.553) to camera." }, { "from": "gpt", "value": "Point (0.576, 0.553) and camera are 2.73 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/74d7853f5fd90d35.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person who needs to deliver a package to the woman in the scene. You see the pink fabric tank top at center and the brown wooden rake at center. Which object is closer to the left side of the scene?" }, { "from": "gpt", "value": "The pink fabric tank top at center is to the left of the brown wooden rake at center, so it is closer to the left side of the scene." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/800d97dd8caa96c1.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the sequined purple dress at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.671, 0.555)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c8f02dd10ee62a9.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.360, 0.573) or point (0.686, 0.527)?" }, { "from": "gpt", "value": "The point (0.686, 0.527) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c633061c0ddf037.jpg", "conversations": [ { "from": "human", "value": "\nYou are setting up a video call and need to adjust the camera position so that both the matte black monitor at center and the beige fabric face at center are visible. Based on their positions, which object should you move closer to the left side to achieve this?" }, { "from": "gpt", "value": "The beige fabric face at center should be moved closer to the left side because the matte black monitor at center is already positioned to its right. By moving the beige fabric face to the left, both objects will be aligned within the camera frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ac6f9a6d11c8e2d.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person trying to park your white matte van at lower center near the building. There is another white matte van at center already parked. Which van is shorter and can fit into a tighter parking spot?" }, { "from": "gpt", "value": "The white matte van at lower center is shorter than the white matte van at center, so it can fit into a tighter parking spot." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4563fce9d74fd55c.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of white matte ambulance at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.449, 0.569)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b13f86672fd6987.jpg", "conversations": [ { "from": "human", "value": "\nBetween black fleece jacket at center and light blue quilted jacket at center, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "From the viewer's perspective, black fleece jacket at center appears more on the right side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b9ab8aefd02b700.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of point (0.766, 0.717)?" }, { "from": "gpt", "value": "The distance of point (0.766, 0.717) from camera is 3.39 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d4c5ad31a9be2e7a.jpg", "conversations": [ { "from": "human", "value": "\nDescribe the object at (0.518, 0.853)." }, { "from": "gpt", "value": "light blue shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/732d3d301674feb6.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, green leafy palm tree at left or blue jeans at lower right?" }, { "from": "gpt", "value": "Standing shorter between the two is blue jeans at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd7abc88d8582de5.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.845, 0.867) come behind point (0.331, 0.795)?" }, { "from": "gpt", "value": "No, (0.845, 0.867) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/601a8f1e52950e72.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between point (0.292, 0.947) and camera." }, { "from": "gpt", "value": "Point (0.292, 0.947) is 6.36 feet away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3deb5a40b3f5e91e.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.641, 0.730) or point (0.315, 0.272)?" }, { "from": "gpt", "value": "The point (0.315, 0.272) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16b30baa1e16e202.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.649, 0.838)?" }, { "from": "gpt", "value": "blue metal fence at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b51c6ba0a8e2708d.jpg", "conversations": [ { "from": "human", "value": "\nWhere is black metal clock at upper center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.538, 0.297)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4c628077f80f89d5.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of blue liquid water at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.901, 0.517)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b2b16207febcfc0.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.282, 0.361) behind point (0.920, 0.648)?" }, { "from": "gpt", "value": "Yes, point (0.282, 0.361) is behind point (0.920, 0.648)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4be1ac49b6de9e2b.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark brown wooden table at center appear on the right side of dark brown wooden cross at center?" }, { "from": "gpt", "value": "Indeed, dark brown wooden table at center is positioned on the right side of dark brown wooden cross at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60ea3ca1b7803afd.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.163, 0.509)?" }, { "from": "gpt", "value": "white apron at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/41fd34e804d83a8f.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.198, 0.948) or (0.732, 0.838)?" }, { "from": "gpt", "value": "Point (0.732, 0.838)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0fb25e72a6da1dcf.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer planning to take a picture of the shrine. You notice two shirts hanging on a rack near the entrance. The shirts are the blue printed shirt at lower center and the blue plaid shirt at center. Which shirt should you avoid including in your photo to ensure the shrine remains the main focus, considering their positions?" }, { "from": "gpt", "value": "The blue printed shirt at lower center is shorter than the blue plaid shirt at center. Since the shorter shirt might be less likely to obstruct the shrine, you should avoid including the taller blue plaid shirt at center to keep the shrine as the main focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8f67d6281117c88a.jpg", "conversations": [ { "from": "human", "value": "\nYou are trying to locate the dark gray suit at center in the image. What are its coordinates?" }, { "from": "gpt", "value": "The coordinates of the dark gray suit at center are at point (0.683, 0.694)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5904597d19096d5e.jpg", "conversations": [ { "from": "human", "value": "\nDoes white plastic table at center have a lesser height compared to metallic silver stool at lower right?" }, { "from": "gpt", "value": "No, white plastic table at center is not shorter than metallic silver stool at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0030ba341a7c4b55.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to white glossy canoe at center? Please provide its 2D coordinates.Where can I find white glossy canoe at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.290, 0.558)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02e7b2e154e4c458.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of clear glass water at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.334, 0.744)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c35c4a921993ec68.jpg", "conversations": [ { "from": "human", "value": "\nHow close is matte blue mesh top at center from camera?" }, { "from": "gpt", "value": "matte blue mesh top at center and camera are 4.77 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2f155881c90be32.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.777, 0.459) positioned before point (0.347, 0.414)?" }, { "from": "gpt", "value": "Yes, point (0.777, 0.459) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c98c17ec6aa8c272.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.019, 0.261) or point (0.237, 0.494)?" }, { "from": "gpt", "value": "Point (0.019, 0.261)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/97b51113dea4b671.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing 16.96 inches away from the point at coordinates point (0.054, 0.353). If you want to place a small pebble there, will you be able to do so without moving your current position?" }, { "from": "gpt", "value": "Yes, because the distance between you and point (0.054, 0.353) is exactly 16.96 inches, so you can reach it from your current position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b729239eb9d1c92.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the matte yellow sweater at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.681, 0.427)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0aaaab282091c80d.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, green leafy tree at center or muddy water at center?" }, { "from": "gpt", "value": "muddy water at center is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/349bad5723476441.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of transparent glass bottle at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.505, 0.709)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3f3da25af1c2eaac.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of multicolored woven vase at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.228, 0.458)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1df88ef161b76eb.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.425, 0.711) or point (0.319, 0.544)?" }, { "from": "gpt", "value": "Positioned in front is point (0.425, 0.711)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8456b00c93d504b0.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between stone steps at center and green leafy tree at upper center?" }, { "from": "gpt", "value": "4.32 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8624585ab31be770.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.349, 0.388) farther from viewer compared to point (0.503, 0.247)?" }, { "from": "gpt", "value": "No, (0.349, 0.388) is in front of (0.503, 0.247)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7d3c624dd4f4be00.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and want to reach the point marked as point (0.824, 0.792). How far do you need to walk to get there?" }, { "from": "gpt", "value": "The point (0.824, 0.792) is 83.42 meters away from the camera, so you need to walk 83.42 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58b9029584651f77.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black matte jacket at center is bigger than black matte video camera at lower left?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1255a0c2ceb44e6b.jpg", "conversations": [ { "from": "human", "value": "\nDoes red fabric jacket at center have a lesser width compared to light brown leather jacket at center?" }, { "from": "gpt", "value": "Incorrect, red fabric jacket at center's width is not less than light brown leather jacket at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a026da5483f91dab.jpg", "conversations": [ { "from": "human", "value": "\nBetween gray stone face at center and gray stone statue at center, which one has more height?" }, { "from": "gpt", "value": "gray stone statue at center is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ab18808b9bd99be.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of black asphalt highway at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.485, 0.795)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/785b4be2484ed843.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the left, black fabric dress at lower right or white cotton shirt at center?" }, { "from": "gpt", "value": "Positioned to the left is white cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c783ef50335be8a.jpg", "conversations": [ { "from": "human", "value": "\nIs gray cotton shirt at center bigger than dark gray suit at center?" }, { "from": "gpt", "value": "Incorrect, gray cotton shirt at center is not larger than dark gray suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/80c0cddbbacbaa3b.jpg", "conversations": [ { "from": "human", "value": "\nYou are trying to determine the exact position of the black leather shoe at center in the image. What are the coordinates of its location?" }, { "from": "gpt", "value": "The coordinates of the black leather shoe at center are at point (0.561, 0.867)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a6932ae45b066da.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.598, 0.605) less distant than point (0.382, 0.273)?" }, { "from": "gpt", "value": "Yes, point (0.598, 0.605) is in front of point (0.382, 0.273)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b66006e1a895353.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.322, 0.384) or (0.492, 0.422)?" }, { "from": "gpt", "value": "Positioned in front is point (0.492, 0.422)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d3ea88c5f020ee45.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.728, 0.147) and point (0.066, 0.436), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.066, 0.436)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0c139f3d30490f27.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer using a camera with a minimum focusing distance of 12 inches. You want to take a closeup shot of the blue glossy eye at center. Can you focus on it without moving the camera closer?" }, { "from": "gpt", "value": "The blue glossy eye at center is 13.35 inches away from camera, which is beyond the camera minimum focusing distance of 12 inches. Therefore, the camera can focus on the blue glossy eye at center without needing to move closer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef5491ddf0eaeb46.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.866, 0.670) from camera?" }, { "from": "gpt", "value": "5.63 feet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9691b2144fdca88e.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark brown fabric uniform at center have a larger size compared to white cotton shirt at upper right?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04ece8903a62470e.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of matte black cycling outfit at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.567, 0.531)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8a4d39df77d6816.jpg", "conversations": [ { "from": "human", "value": "\nIs floral printed fabric at lower center thinner than matte pink shirt at center?" }, { "from": "gpt", "value": "No, floral printed fabric at lower center is not thinner than matte pink shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/72f5df15682a545f.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.216, 0.650) come in front of point (0.631, 0.438)?" }, { "from": "gpt", "value": "No, it is behind (0.631, 0.438)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/17b783ed27154932.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the industrial area depicted in the scene. You need to reach a specific point marked as point (0.735, 0.658). How far is this point from your current position?" }, { "from": "gpt", "value": "The point (0.735, 0.658) is 6.05 meters away from the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29d28a1214596be4.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of brushed metal rail at left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.229, 0.744)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/20854ed02cd2fb27.jpg", "conversations": [ { "from": "human", "value": "\nYou are a parent watching your child play in the ball pit. Your child, the white matte baby at center, wants to reach the yellow matte ball at center. Can they grab it without moving their position?" }, { "from": "gpt", "value": "The white matte baby at center is 24.50 inches away from the yellow matte ball at center. Since the distance is too far for a baby to reach without moving, they cannot grab it without adjusting their position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/90e20f0ff2e96585.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.240, 0.486) and point (0.854, 0.553), which one is positioned behind?" }, { "from": "gpt", "value": "Positioned behind is point (0.854, 0.553)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0f1ee9444e5f652.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to adjust the lighting for a photo shoot. You notice the matte black sunglasses at upper center and the black matte dress at center. Which object is located to the right of the other?" }, { "from": "gpt", "value": "The matte black sunglasses at upper center is positioned on the right side of black matte dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d41395043a075c6b.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green leafy bush at right? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.823, 0.188)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0c621f47a987f2c7.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the green grass at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.486, 0.845)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/997ab4752ba66279.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.573, 0.537) and point (0.436, 0.567), which one is positioned in front?" }, { "from": "gpt", "value": "Positioned in front is point (0.436, 0.567)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6fc7e483e6e27d5.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the matte purple shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.439, 0.525)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ccf6131c5212e0b9.jpg", "conversations": [ { "from": "human", "value": "\nHow far is metallic gray roof at lower left from camera?" }, { "from": "gpt", "value": "The distance of metallic gray roof at lower left from camera is 17.55 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f3a156e22bacd0c2.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green grassy hillside at left is smaller than greenish-blue water at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dcb8bd34ced1562a.jpg", "conversations": [ { "from": "human", "value": "\nYou are driving and need to check your blind spot. You look at the clear glass mirror at center and the asphalt road at center. Which one takes up more space in your view?" }, { "from": "gpt", "value": "The asphalt road at center takes up more space in your view because the clear glass mirror at center occupies less space than asphalt road at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f3d8fb3da4d8f029.jpg", "conversations": [ { "from": "human", "value": "\nYou are attending a panel discussion at Campus Party and notice two attendees wearing a matte gray suit at center and a black hoodie at center. Which one is positioned to the right?" }, { "from": "gpt", "value": "The matte gray suit at center is positioned to the right of the black hoodie at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a0d687aa53ae82b.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the right, yellow fabric safety vest at center or navy blue fabric baseball cap at upper left?" }, { "from": "gpt", "value": "yellow fabric safety vest at center is more to the right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d21541a3cb86e721.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.582, 0.294) come farther from viewer compared to point (0.746, 0.019)?" }, { "from": "gpt", "value": "No, (0.582, 0.294) is in front of (0.746, 0.019)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/35d8d0da23154d27.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, white checkered shirt at center or red and white striped shirt at center, stands shorter?" }, { "from": "gpt", "value": "With less height is red and white striped shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab4ab6f0504c8eaf.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from purple glossy electric guitar at center to camera." }, { "from": "gpt", "value": "They are 3.56 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/191a6a0cdfe6c15e.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the silver metallic laptop at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.442, 0.820)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c039e1105e7df4ff.jpg", "conversations": [ { "from": "human", "value": "\nBetween beige fabric couch at left and yellow t-shirt at center, which one has less height?" }, { "from": "gpt", "value": "yellow t-shirt at center is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2780407fad4c68f6.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the brown leather jacket at left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.313, 0.531)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f81f0d657ce60c57.jpg", "conversations": [ { "from": "human", "value": "\nWhat is located at the coordinates point (0.310, 0.830) in the image?" }, { "from": "gpt", "value": "The shiny black laptop at lower left is located at point (0.310, 0.830)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6fb33178ed887bfa.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between point (0.533, 0.678) and camera?" }, { "from": "gpt", "value": "Point (0.533, 0.678) and camera are 26.06 feet apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4192d9a5f60d6dc1.jpg", "conversations": [ { "from": "human", "value": "\nIs multicolored painted pavilion at center smaller than blue denim jacket at lower right?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86dfb0b2a54a7086.jpg", "conversations": [ { "from": "human", "value": "\nYou are sitting at the platform and want to place your phone on the metallic textured table at center and the white matte mug at center. Which object should you place it on to keep it closer to the edge of the platform?" }, { "from": "gpt", "value": "You should place your phone on the metallic textured table at center because it is to the right of the white matte mug at center, and since the platform edge is on the right side, it would be closer to the edge." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d177f58ba367d1d8.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance from white metal rail at upper center to golden textured horse at center." }, { "from": "gpt", "value": "34.21 feet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a065a7fcbd9f071.jpg", "conversations": [ { "from": "human", "value": "\nWhat object is located at the coordinates point (0.229, 0.630)?" }, { "from": "gpt", "value": "The dark gray suit at left is located at point (0.229, 0.630)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5751c4ae4f4eef6.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.267, 0.286) and point (0.218, 0.775), which one is positioned in front?" }, { "from": "gpt", "value": "Positioned in front is point (0.218, 0.775)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0fa2f1b27b908466.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from rusty metal cannon at lower left to rusty metal cannon at center." }, { "from": "gpt", "value": "rusty metal cannon at lower left is 2.48 meters away from rusty metal cannon at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04473542199a6df4.jpg", "conversations": [ { "from": "human", "value": "\nYou are an architect analyzing the building structure. You need to determine which object occupies more horizontal space in the image between the brown tiled tower at center and the metallic silver clock at center. Which one is wider?" }, { "from": "gpt", "value": "The brown tiled tower at center is wider than the metallic silver clock at center according to the description provided." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d2e802e3ae0c3990.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.624, 0.684) come farther from viewer compared to point (0.564, 0.066)?" }, { "from": "gpt", "value": "Yes, it is behind point (0.564, 0.066)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/006a75064ece9cfb.jpg", "conversations": [ { "from": "human", "value": "\nYou are a tourist visiting the Leaning Tower of Pisa and notice both the white stone tower at center and the striped sweater at center in the scene. From your vantage point, which object is closer to you?" }, { "from": "gpt", "value": "The white stone tower at center is closer to you because the striped sweater at center is behind it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/863c9347172e7e43.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.919, 0.933) lie behind point (0.467, 0.522)?" }, { "from": "gpt", "value": "Yes, point (0.919, 0.933) is behind point (0.467, 0.522)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dbc23792cc2a70f3.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of gravel at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.517, 0.892)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5bd2ceb111b06b59.jpg", "conversations": [ { "from": "human", "value": "\nIs light gray fabric bicycle at center taller than shiny black car at lower right?" }, { "from": "gpt", "value": "Correct, light gray fabric bicycle at center is much taller as shiny black car at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/151d3b3369963608.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the patio and want to place a small potted plant between the black matte tank top at center and the wooden table at center. Which object should the plant be closer to based on their positions?" }, { "from": "gpt", "value": "The plant should be placed closer to the wooden table at center because the black matte tank top at center is closer to the viewer than the wooden table at center, so the distance between them requires the plant to be near the farther object to maintain balance." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fd78e2987ed1f8da.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.404, 0.678) or point (0.803, 0.484)?" }, { "from": "gpt", "value": "Positioned behind is point (0.803, 0.484)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/350f38203c4d3135.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of printed cotton shorts at center in the image." }, { "from": "gpt", "value": "[(0.742, 0.731)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/598bb1f12498e1cd.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.754, 0.375) less distant than point (0.406, 0.584)?" }, { "from": "gpt", "value": "No, (0.754, 0.375) is further to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dbd26d2b135976b7.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the green leafy tree at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.781, 0.298)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ce96b161068f6e2.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if smooth concrete at lower left is positioned below white cotton shirt at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05e9fd3217ca3657.jpg", "conversations": [ { "from": "human", "value": "\nPoint to concrete bridge at center.Point to the concrete bridge at center in the image." }, { "from": "gpt", "value": "[(0.785, 0.467)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00141962b7815d54.jpg", "conversations": [ { "from": "human", "value": "\nYou are a safety officer at the shooting range. You notice two people in the scene. One is wearing a camouflage uniform at left, and the other is wearing a navy blue fabric jacket at center. According to safety protocols, all participants must be at least 2 meters apart. Can you determine if they are complying with this rule based on their positions?" }, { "from": "gpt", "value": "The camouflage uniform at left is to the left of the navy blue fabric jacket at center, but the distance between them isn not specified in the objects description. Therefore, it is impossible to determine if they are complying with the 2 meters apart rule based on the given information." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c0ef1a488e2e5ef1.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of blue sweatshirt at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.844, 0.597)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c17186f5ed79bce6.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of green helmeted man at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.452, 0.511)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/056757c237c2bfdc.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green glossy duck at center is positioned above brown speckled duck at center?" }, { "from": "gpt", "value": "Incorrect, green glossy duck at center is not positioned above brown speckled duck at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/646f27c164746457.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, matte gray shoe at center or white cotton sock at center?" }, { "from": "gpt", "value": "With more height is matte gray shoe at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6707989e1f64dddd.jpg", "conversations": [ { "from": "human", "value": "\nWhat is at (0.525, 0.778)?" }, { "from": "gpt", "value": "gray ribbed paddleboard at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b72ce234eaf05b31.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of bumpy beige rock at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.617, 0.613)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ac0d55f9826ab858.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to concrete steps at lower center? Please provide its 2D coordinates.Where can I find concrete steps at lower center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.530, 0.869)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e1b7057d84f2b5ab.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of matte black laptop at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.398, 0.498)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de3380381f2bf394.jpg", "conversations": [ { "from": "human", "value": "\nBetween bare branches at upper right and smooth brown tower at center, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "Positioned to the left is smooth brown tower at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d5490bdc1de95db.jpg", "conversations": [ { "from": "human", "value": "\nLocate all matte white sign at center in the image." }, { "from": "gpt", "value": "[(0.183, 0.605)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/312d39c24de6d7dd.jpg", "conversations": [ { "from": "human", "value": "\nDoes pink matte apple at lower left come behind yellow-green matte apple at center-right?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/13459baf6524c0e9.jpg", "conversations": [ { "from": "human", "value": "\nLocate dark brown leather jacket at center in the image." }, { "from": "gpt", "value": "[(0.669, 0.700)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4929b816abc67bd6.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny metallic dress at center wider than leopard print dress at center?" }, { "from": "gpt", "value": "Indeed, shiny metallic dress at center has a greater width compared to leopard print dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5490bb31e7666b0.jpg", "conversations": [ { "from": "human", "value": "\nDoes green matte tray at center appear over sesame seed bun at center?" }, { "from": "gpt", "value": "Indeed, green matte tray at center is positioned over sesame seed bun at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb1b7eef182f8151.jpg", "conversations": [ { "from": "human", "value": "\nBetween brown/mountainous at upper center and clear water at lower left, which one has less height?" }, { "from": "gpt", "value": "clear water at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1cfddb5b9e2b95f6.jpg", "conversations": [ { "from": "human", "value": "\nIs white powdery snow at center positioned at the back of green plastic picnic table at center?" }, { "from": "gpt", "value": "No, white powdery snow at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df018b2a431d2570.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the brown fabric jacket at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.728, 0.681)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7761092fa8b6567a.jpg", "conversations": [ { "from": "human", "value": "\nDoes silver chain-link fence at left lie behind blue painted wood at upper center?" }, { "from": "gpt", "value": "No, silver chain-link fence at left is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/859507f901774cdd.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the black rubber car at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.950, 0.713)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fdbd01b8a2dbae50.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of matte black tank top at upper right? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.888, 0.650)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2185b2fadcc0b081.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.399, 0.814) come in front of point (0.580, 0.306)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.580, 0.306)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77ac688cdc4cfd53.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the left, blue plastic stool at lower center or white glossy taxi at center?" }, { "from": "gpt", "value": "blue plastic stool at lower center is more to the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/64eed520b043f25d.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the plaid cotton shirt at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.751, 0.747)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff6ef633122c1365.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a detailed shot of the multicolored sheer scarf at center and the blue satin headscarf at center. Which one is positioned closer to the camera?" }, { "from": "gpt", "value": "The multicolored sheer scarf at center is positioned closer to the camera than the blue satin headscarf at center because it is in front of it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29d30134f3c0836b.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between light gray jacket at center and camera?" }, { "from": "gpt", "value": "A distance of 5.14 feet exists between light gray jacket at center and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/968bd1aa155e1b5b.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the right, white glossy necklace at upper center or matte white shirt at center?" }, { "from": "gpt", "value": "white glossy necklace at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/48288c1cdf31b7cc.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of printed fabric dress at center from camera?" }, { "from": "gpt", "value": "The distance of printed fabric dress at center from camera is 1.51 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c095fd72f2dddcec.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, black matte jacket at center or light blue and white jacket at center?" }, { "from": "gpt", "value": "Positioned higher is light blue and white jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aed1e83071004028.jpg", "conversations": [ { "from": "human", "value": "\nWhere is black textured blazer at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.342, 0.606)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ea0dc0eac74174d.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of blue matte jersey at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.349, 0.444)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7036f0e312acf291.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the pink fleece jacket at left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.258, 0.739)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/53a8e02d420482b6.jpg", "conversations": [ { "from": "human", "value": "\nDoes white paper at upper center have a lesser height compared to wooden podium at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bfdb768640fc1c7e.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, wooden beam at center or brown concrete beam at upper center?" }, { "from": "gpt", "value": "wooden beam at center is below." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1753d67d1d10495b.jpg", "conversations": [ { "from": "human", "value": "\nDoes white glossy car at center appear on the left side of red matte jacket at center?" }, { "from": "gpt", "value": "Correct, you'll find white glossy car at center to the left of red matte jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/67e240cb31c52691.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between smooth blonde hair at center and camera." }, { "from": "gpt", "value": "smooth blonde hair at center is 3.93 feet from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e7253fd4ff340154.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.819, 0.519)?" }, { "from": "gpt", "value": "white bark tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/727c4e25691d7728.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.284, 0.880) and camera?" }, { "from": "gpt", "value": "The distance of point (0.284, 0.880) from camera is 3.52 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dfd75f815389af2c.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.161, 0.980) come farther from viewer compared to point (0.802, 0.478)?" }, { "from": "gpt", "value": "No, (0.161, 0.980) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b8ce094dd4cf2c9e.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, gray cotton shirt at upper left or gray fabric pants at center?" }, { "from": "gpt", "value": "gray fabric pants at center is above." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82f2a2b90625daed.jpg", "conversations": [ { "from": "human", "value": "\nIs frosted grass at center closer to the viewer compared to white frosty bush at center?" }, { "from": "gpt", "value": "Yes, it is in front of white frosty bush at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7a83e6719453f06d.jpg", "conversations": [ { "from": "human", "value": "\nHow close is white matte shirt at lower left from blue plastic cooler at lower center?" }, { "from": "gpt", "value": "7.16 feet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05dc2df87b535ff8.jpg", "conversations": [ { "from": "human", "value": "\nHow far is point (0.436, 0.923) from the camera?" }, { "from": "gpt", "value": "Point (0.436, 0.923) is 59.02 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b6bd56c42feaccb1.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, black matte ford fiesta at center or dark green hoodie at center?" }, { "from": "gpt", "value": "Positioned to the left is dark green hoodie at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a3f0d53306767f00.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.127, 0.825) from camera?" }, { "from": "gpt", "value": "4.02 feet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4174d7ae06f1036e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte gray shirt at center is smaller than gray matte shirt at center?" }, { "from": "gpt", "value": "Correct, matte gray shirt at center occupies less space than gray matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e15ff1331cebe17.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if metallic gold mask at upper right is positioned below shiny metallic bracelet at left?" }, { "from": "gpt", "value": "Incorrect, metallic gold mask at upper right is not positioned below shiny metallic bracelet at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/998cb4b7697a4675.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of green grass pasture at center?" }, { "from": "gpt", "value": "They are 14.10 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bcc101a956f15432.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of teak wood table at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.446, 0.708)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78f8a2f2dfd941a6.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black bass guitar at left shorter than gold metallic saxophone at right?" }, { "from": "gpt", "value": "Correct, matte black bass guitar at left is not as tall as gold metallic saxophone at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef5a3a1161e10864.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.392, 0.720) or (0.859, 0.995)?" }, { "from": "gpt", "value": "The point (0.392, 0.720) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3bf56d2cea793bc9.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the smooth water at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.510, 0.214)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16e09c356e034115.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the owl in the image. The camera is focused on the point marked as point (0.477, 0.769). Where is the owl located relative to this point?" }, { "from": "gpt", "value": "The brown feathered owl at center is exactly at point (0.477, 0.769), so the owl is located right at the camera focus point." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f646dd732bb8699d.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a group photo of the matte green shirt at center and the purple fuzzy coat at lower center. If you want both subjects to appear equally sized in the photo, which subject should you move closer to the camera and by how much?" }, { "from": "gpt", "value": "The purple fuzzy coat at lower center is smaller in width than the matte green shirt at center. To make them appear the same size in the photo, move the purple fuzzy coat at lower center closer to the camera by an amount that compensates for its smaller width compared to the matte green shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8f3a64be5da3b4c4.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.209, 0.636)?" }, { "from": "gpt", "value": "white paisley shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36428862b76296eb.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position looking at the poster. There is a point marked at coordinates point (0.621, 0.586). How far is that point from you?" }, { "from": "gpt", "value": "The point (0.621, 0.586) is 37.51 inches away from the camera position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ef0fabc27d7cd3e.jpg", "conversations": [ { "from": "human", "value": "\nLocate white plastic microscope at center in the image." }, { "from": "gpt", "value": "[(0.523, 0.730)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/32227d2914b073a6.jpg", "conversations": [ { "from": "human", "value": "\nYou are a pedestrian trying to navigate through the market area. There is an orange reflective diamond shaped sign at center. Where exactly is this sign located in relation to the point you are standing at coordinates point (0.424, 0.444)?" }, { "from": "gpt", "value": "The orange reflective diamond shaped sign at center is located exactly at the point you are standing at coordinates point (0.424, 0.444)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb0c8a84919ea11e.jpg", "conversations": [ { "from": "human", "value": "\nWhere is granite rock formation at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.558, 0.325)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/446ba90d4ffee67c.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of bare wood tree at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.530, 0.242)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db09e0d54e828094.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte jacket at center below dark gray jacket at left?" }, { "from": "gpt", "value": "Indeed, black matte jacket at center is positioned under dark gray jacket at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d008a1adda83788a.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of dark blue jersey at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.757, 0.484)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58ede87ccd2bf38c.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.733, 0.528)?" }, { "from": "gpt", "value": "brown suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fcc6d7df2e9c2844.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the brown stone statue at center and the green grass at lower center in a single shot. Based on their sizes, which object should appear larger in the photo?" }, { "from": "gpt", "value": "The brown stone statue at center should appear larger in the photo because it has a greater height compared to the green grass at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d67dc6610ba69b3.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in a traditional Japanese garden and want to take a photo of the wooden gazebo at center. If your camera has a maximum focus range of 10 feet, will you be able to capture the gazebo clearly?" }, { "from": "gpt", "value": "The wooden gazebo at center is 8.95 feet away from the viewer. Since this distance is within the camera maximum focus range of 10 feet, the gazebo can be captured clearly." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0771d336e5d9e9f0.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the dark brown fur monkey at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.465, 0.441)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ce21d0e54cbc24f.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person who needs to place a package on the desk. The package is 1.8 meters long. Can you fit it between the red matte shirt at center and the camera?" }, { "from": "gpt", "value": "The distance between the red matte shirt at center and the camera is 1.73 meters. Since the package is 1.8 meters long, it cannot fit between them as the space is shorter than the package." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d92465340fe8d9f4.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, white matte t-shirt at center or white matte t-shirt at right?" }, { "from": "gpt", "value": "Positioned lower is white matte t-shirt at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/883cfe5aecf96ca1.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to white plastic printer at right? Please provide its 2D coordinates.Where can I find white plastic printer at right? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.942, 0.353)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3abac486d0e5bbea.jpg", "conversations": [ { "from": "human", "value": "\nDoes white plastic table at center have a smaller size compared to black matte microphone at center?" }, { "from": "gpt", "value": "No, white plastic table at center is not smaller than black matte microphone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e53e00d96821b9f4.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the blue glossy fountain at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.535, 0.745)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/008988b1a77005be.jpg", "conversations": [ { "from": "human", "value": "\nIs green mesh running shoe at lower center taller than matte green and yellow hiking boot at lower center?" }, { "from": "gpt", "value": "Yes, green mesh running shoe at lower center is taller than matte green and yellow hiking boot at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0360e4ecb6491b93.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of beige plastic hospital bed at lower center from camera?" }, { "from": "gpt", "value": "A distance of 1.54 meters exists between beige plastic hospital bed at lower center and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3122d7e354061d3f.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the brown stone church at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.468, 0.408)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/65334f1627f824f1.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the Dutch building and notice two people sitting on the steps. One is wearing a dark gray leather jacket at center and the other has a gray textured vest at center. Which clothing item is positioned lower on the person?" }, { "from": "gpt", "value": "The dark gray leather jacket at center is located below the gray textured vest at center, so the dark gray leather jacket at center is positioned lower on the person." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/65033b22c3e69991.jpg", "conversations": [ { "from": "human", "value": "\nDoes orange cotton shirt at center have a smaller size compared to black matte video camera at lower center?" }, { "from": "gpt", "value": "Incorrect, orange cotton shirt at center is not smaller in size than black matte video camera at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/989c95f55b3be2a5.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.902, 0.359) or (0.631, 0.230)?" }, { "from": "gpt", "value": "Point (0.631, 0.230)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/564b26e8d50854c0.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.756, 0.909) positioned after point (0.701, 0.886)?" }, { "from": "gpt", "value": "No, (0.756, 0.909) is in front of (0.701, 0.886)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/42ce5204fa6d5802.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the right, green corrugated metal hut at lower left or brown wooden boat at lower left?" }, { "from": "gpt", "value": "green corrugated metal hut at lower left is more to the right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b818021ea5d20ea8.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.176, 0.825) or (0.921, 0.936)?" }, { "from": "gpt", "value": "Positioned behind is point (0.176, 0.825)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/660d55c15eb54f10.jpg", "conversations": [ { "from": "human", "value": "\nYou are a game master preparing a tabletop game. You have two dice sets, the translucent red dice at left and the white matte dice at left. The game rules state that these two dice must be placed at least 20 inches apart to avoid interference. Based on the scene description, can you confirm if the current placement meets the rule requirements?" }, { "from": "gpt", "value": "The distance between the translucent red dice at left and white matte dice at left is 20.53 inches, which exceeds the minimum requirement of 20 inches. Therefore, the current placement meets the rule requirements." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/43d9981162920d23.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, white matte blood pressure cuff at center or white matte ear at upper left, stands taller?" }, { "from": "gpt", "value": "white matte blood pressure cuff at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e0f66b533744ab8.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.717, 0.250) more distant than point (0.554, 0.603)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc4dc0aa8f47c736.jpg", "conversations": [ { "from": "human", "value": "\nIs matte blue shirt at lower left to the left of light blue denim jacket at center from the viewer's perspective?" }, { "from": "gpt", "value": "Indeed, matte blue shirt at lower left is positioned on the left side of light blue denim jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/398d7a85a6416910.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any white matte shirt at center in the image." }, { "from": "gpt", "value": "[(0.560, 0.600)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/22c79f898e5006f1.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.379, 0.920) positioned after point (0.408, 0.684)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a0b1e85bee32718.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue fabric tank top at center appear over shiny black shorts at upper left?" }, { "from": "gpt", "value": "No, blue fabric tank top at center is not above shiny black shorts at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b6351686d87ea27c.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.824, 0.738) or point (0.356, 0.434)?" }, { "from": "gpt", "value": "Point (0.824, 0.738) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c11d4b35c505e503.jpg", "conversations": [ { "from": "human", "value": "\nYou are a painter who wants to paint the scene. You have a canvas that can only accommodate objects up to the width of the metallic pole at upper right. Can you fit the concrete wall at center onto your canvas?" }, { "from": "gpt", "value": "The concrete wall at center is narrower than the metallic pole at upper right, so yes, the concrete wall at center can fit on the canvas since its width is less than the maximum width allowed." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7624137b1b404074.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.914, 0.248) and camera." }, { "from": "gpt", "value": "14.47 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d3f747bf9464dd7.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of bright orange corrugated metal shipping container at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.560, 0.789)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/124e8175c781d60e.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the concrete bridge at center and looking towards the river. Which direction should you turn to see the dark blue water at center?" }, { "from": "gpt", "value": "You should turn to your right because the dark blue water at center is to the right of the concrete bridge at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a2edfcab01380fa.jpg", "conversations": [ { "from": "human", "value": "\nYou are a tourist standing in front of the matte beige building at left and want to visit the gold ornate tower at center. How far do you have to walk to reach the tower?" }, { "from": "gpt", "value": "The matte beige building at left is 17.12 meters away from the gold ornate tower at center, so you have to walk 17.12 meters to reach the tower." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e1c46366b8bf889.jpg", "conversations": [ { "from": "human", "value": "\nYou are an art curator standing in the exhibition space. You need to guide a visitor to the green matte shirt at center. Which direction should they move from the brown wooden statue at upper left?" }, { "from": "gpt", "value": "The visitor should move to the right from the brown wooden statue at upper left to reach the green matte shirt at center, as the statue is positioned to the left of the shirt." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34d7c551088c71dd.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.619, 0.748)?" }, { "from": "gpt", "value": "charred wood fire at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e760c938b5da91d1.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the center of the image and want to find the green leafy tree at center. According to the coordinates provided, in which direction should you look to locate it?" }, { "from": "gpt", "value": "The green leafy tree at center is located at coordinates approximately 0.588 on the x axis and 0.752 on the y axis. Since you are at the center of the image, which would be at coordinates approximately 0.5 on both axes, the tree is slightly to the right and above your current position. Therefore, you should look to the upper right direction to locate the green leafy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c2951a41fd42772e.jpg", "conversations": [ { "from": "human", "value": "\nIs white distressed wood door at center thinner than yellow metallic taxi at left?" }, { "from": "gpt", "value": "In fact, white distressed wood door at center might be wider than yellow metallic taxi at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/57bcecfe485c6529.jpg", "conversations": [ { "from": "human", "value": "\nIs dirt path at center positioned in front of yellow fabric tent at center-right?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ea30f66fe0874a1.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black suit at left have a lesser width compared to matte black tie at left?" }, { "from": "gpt", "value": "No, matte black suit at left is not thinner than matte black tie at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/38b7f61dac1501dd.jpg", "conversations": [ { "from": "human", "value": "\nWhere is white matte shorts at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.496, 0.667)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5838c3fdf176dc84.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the spotted yellow fish at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.506, 0.195)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7023e52827202a26.jpg", "conversations": [ { "from": "human", "value": "\nYou are helping to arrange furniture in a living room. You have a matte black shirt at center and a matte black couch at center. Which object should you place first if you want to ensure there is enough space for both?" }, { "from": "gpt", "value": "You should place the matte black couch at center first since it is larger in size than the matte black shirt at center, ensuring there is enough space for both objects." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2af7a53ec1de9619.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from point (0.683, 0.170) to camera." }, { "from": "gpt", "value": "Point (0.683, 0.170) and camera are 6.00 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0a28d50b066ad05.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the white painted wood bookshelf at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.852, 0.414)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/285a27a72eb5aa36.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of green reflective water at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.528, 0.309)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6bd8563effd01e48.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.816, 0.477) and point (0.129, 0.641), which one is positioned behind?" }, { "from": "gpt", "value": "Point (0.816, 0.477)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3637ac275eb6dc0c.jpg", "conversations": [ { "from": "human", "value": "\nIs metallic silver shovel at center wider than blue woolen sweater at upper center?" }, { "from": "gpt", "value": "In fact, metallic silver shovel at center might be narrower than blue woolen sweater at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1878be8b9b7c63a4.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from point (0.443, 0.997) to camera." }, { "from": "gpt", "value": "The distance of point (0.443, 0.997) from camera is 5.36 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f67f1362d7db5586.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, pink fabric shorts at center or skinny white man at right, stands taller?" }, { "from": "gpt", "value": "pink fabric shorts at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cdfb3161cb57164d.jpg", "conversations": [ { "from": "human", "value": "\nLooking at the golden ornament against the blue sky, where is the gold polished cherub at center in relation to the gold polished pole at center?" }, { "from": "gpt", "value": "The gold polished cherub at center is to the left of the gold polished pole at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85ccfea54223c713.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of green leafy tree at upper center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.488, 0.342)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e32e2039f6e44a0.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of smooth asphalt road at center?" }, { "from": "gpt", "value": "They are 10.99 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b0fabaacdf2befc.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.306, 0.695)?" }, { "from": "gpt", "value": "black-and-white fur cat at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4b82b8766c5f5b52.jpg", "conversations": [ { "from": "human", "value": "\nBetween shiny metallic armor at left and camouflage fabric rifle at right, which one is positioned higher?" }, { "from": "gpt", "value": "shiny metallic armor at left is above." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c167bc6bc4e734d8.jpg", "conversations": [ { "from": "human", "value": "\nPoint to wooden table at center.Point to the wooden table at center in the image." }, { "from": "gpt", "value": "[(0.678, 0.872)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/034990b9efc866c5.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of the venue and see the point marked at coordinates (0.748, 0.653). Which object in the scene does this point belong to?" }, { "from": "gpt", "value": "The point marked at coordinates (0.748, 0.653) belongs to the black wool coat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3f24cd35e701d7ce.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer adjusting your camera settings to capture the scene. You notice two points of interest in the image, labeled as point (0.623, 0.206) and point (0.140, 0.716). Which point should you focus on first if you want to ensure the closest object is in sharp focus?" }, { "from": "gpt", "value": "Point (0.623, 0.206) should be focused on first because it is closer to the camera than point (0.140, 0.716), ensuring the closest object is in sharp focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bee727593185472d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white glossy screen at upper center is thinner than light brown wooden desk at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ffcc002bdf9c631.jpg", "conversations": [ { "from": "human", "value": "\nIs white smoke at left to the left of smooth gravel track at center from the viewer's perspective?" }, { "from": "gpt", "value": "Indeed, white smoke at left is positioned on the left side of smooth gravel track at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44d916f2d09c8ae7.jpg", "conversations": [ { "from": "human", "value": "\nLocate gray matte shirt at center in the image." }, { "from": "gpt", "value": "[(0.278, 0.614)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/74377154301b7551.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.725, 0.969) in front of point (0.931, 0.353)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.931, 0.353)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba58fcde60d639a7.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.178, 0.364) or point (0.531, 0.356)?" }, { "from": "gpt", "value": "Point (0.178, 0.364) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd18304dc3556234.jpg", "conversations": [ { "from": "human", "value": "\nYou are an interior designer working on a project and need to know the distance between the blue fabric cap at left and the matte blue baseball cap at left. Can you confirm if they are more than 4 centimeters apart?" }, { "from": "gpt", "value": "The blue fabric cap at left is 4.20 centimeters away from the matte blue baseball cap at left, so yes, they are more than 4 centimeters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e5eec0264c77815d.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.518, 0.345) farther from viewer compared to point (0.576, 0.458)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be535b2888882417.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any metallic silver van at lower right in the image." }, { "from": "gpt", "value": "[(0.919, 0.739)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36144051635fc5f9.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between silhouette fabric at left and camera." }, { "from": "gpt", "value": "They are 2.91 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9a7ae6d37639ff27.jpg", "conversations": [ { "from": "human", "value": "\nDoes foggy translucent morning fog at upper center have a greater height compared to green leafy bush at center?" }, { "from": "gpt", "value": "Yes, foggy translucent morning fog at upper center is taller than green leafy bush at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4487044075848c5f.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of smokey gray fur at upper left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.341, 0.208)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9083b63354677229.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a brown rough bark tree at left. Pinpoint a point to the brown rough bark tree at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.127, 0.214)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/75edb6daaabf2982.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the left, bare branches at upper right or green leafy tree at lower right?" }, { "from": "gpt", "value": "Positioned to the left is green leafy tree at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ddfc9081e5ee8dc1.jpg", "conversations": [ { "from": "human", "value": "\nIs green fabric climbing harness at upper center smaller than matte green long-sleeve shirt at upper center?" }, { "from": "gpt", "value": "No, green fabric climbing harness at upper center is not smaller than matte green long-sleeve shirt at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7fdc4432d6c53bde.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of blue water at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.675, 0.878)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/feb832a8b074a476.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark gray t-shirt at center is thinner than black striped shirt at center?" }, { "from": "gpt", "value": "Indeed, dark gray t-shirt at center has a lesser width compared to black striped shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1adae95af67495cc.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the green artificial turf at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.458, 0.830)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/18df1e1690775617.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte water at center bigger than white plastic boat at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/483d31276c9630ec.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the matte gray shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.435, 0.778)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/91de45e6a0dd5e60.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.288, 0.630) closer to viewer compared to point (0.143, 0.611)?" }, { "from": "gpt", "value": "Yes, point (0.288, 0.630) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/973bf9b0754146fe.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown matte plate at center is shorter than brown matte saucer at lower left?" }, { "from": "gpt", "value": "In fact, brown matte plate at center may be taller than brown matte saucer at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a3dafea103a28fe5.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from point (0.346, 0.925) to camera." }, { "from": "gpt", "value": "Point (0.346, 0.925) and camera are 11.59 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd91b76deb297246.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.898, 0.580) closer to camera compared to point (0.631, 0.592)?" }, { "from": "gpt", "value": "No, (0.898, 0.580) is further to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/98f1375d44892845.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.373, 0.688) or (0.585, 0.992)?" }, { "from": "gpt", "value": "Positioned in front is point (0.585, 0.992)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/52542ba9a2eaddc1.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point labeled as point (0.495, 0.533) and want to take a selfie with the camera. How far do you need to walk to reach the camera?" }, { "from": "gpt", "value": "You need to walk 8.10 meters to reach the camera from point (0.495, 0.533)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/350c8e7f6a40b208.jpg", "conversations": [ { "from": "human", "value": "\nHow close is matte gray t-shirt at left from camera?" }, { "from": "gpt", "value": "3.79 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/da76a0df2aa0c5b9.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between white glossy bathtub at center and black matte picture frame at upper center?" }, { "from": "gpt", "value": "white glossy bathtub at center and black matte picture frame at upper center are 3.83 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5ea3669e150bef0f.jpg", "conversations": [ { "from": "human", "value": "\nWhere is blue fleece jacket at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.675, 0.686)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/71705f1cfb181ec3.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.526, 0.603) and point (0.834, 0.978), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.834, 0.978)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/59c87bf2b7706ce3.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.492, 0.541)?" }, { "from": "gpt", "value": "white glass tower at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d09bbb20f24a41d.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.475, 0.291) and point (0.765, 0.450), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.765, 0.450)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07e8cdaeeada2137.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green matte tree at upper right? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.894, 0.139)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f279451ee3ef803d.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.278, 0.848) positioned after point (0.454, 0.511)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/27aabea3f616f19a.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the glossy wood door at center and want to reach the transom window above it. How far do you need to stretch your hand to touch the transom window?" }, { "from": "gpt", "value": "The glossy wood door at center and the transom window are 14.81 feet apart, so you need to stretch your hand 14.81 feet to touch the transom window." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e333e97fb65441b3.jpg", "conversations": [ { "from": "human", "value": "\nIs matte green backpack at center closer to the viewer compared to matte blue backpack at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0037df9f4ad04cf5.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of black checkered board at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.520, 0.903)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/59540865277860dc.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, vintage paper-toned tonique at center or orange paper bottle at center, stands shorter?" }, { "from": "gpt", "value": "Standing shorter between the two is orange paper bottle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58995274339057b0.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the matte purple jacket at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.519, 0.584)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e583f6fa777986c.jpg", "conversations": [ { "from": "human", "value": "\nIs light pink lace sweater at center behind matte black sweater at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7c32b68aa51eb48.jpg", "conversations": [ { "from": "human", "value": "\nDoes silver metallic car at lower left appear under transparent glass car window at center?" }, { "from": "gpt", "value": "Correct, silver metallic car at lower left is located below transparent glass car window at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/698a6bf5205fb180.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.739, 0.742) or point (0.037, 0.581)?" }, { "from": "gpt", "value": "Point (0.037, 0.581)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/17ea7925e34054d1.jpg", "conversations": [ { "from": "human", "value": "\nDoes green matte watermelon at lower left have a greater width compared to white plastic goggles at upper center?" }, { "from": "gpt", "value": "Yes, green matte watermelon at lower left is wider than white plastic goggles at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc51650e0a45e610.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.676, 0.245) farther from camera compared to point (0.567, 0.466)?" }, { "from": "gpt", "value": "No, (0.676, 0.245) is in front of (0.567, 0.466)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4dd79439f7d8278.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the purple striped shirt at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.639, 0.744)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c49a9f711fd8548c.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.151, 0.797) and point (0.349, 0.295), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.151, 0.797) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6882df0a4ea0a668.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny green and white car at center smaller than shiny red toy car at center?" }, { "from": "gpt", "value": "Actually, shiny green and white car at center might be larger than shiny red toy car at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d22cb325333b38e3.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.917, 0.133) or (0.040, 0.881)?" }, { "from": "gpt", "value": "Positioned in front is point (0.040, 0.881)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/686c8399d7f0c7f4.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any green grassy at center in the image." }, { "from": "gpt", "value": "[(0.494, 0.844)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/abb4521d03e642e6.jpg", "conversations": [ { "from": "human", "value": "\nHow much distance is there between white matte backpack at center and white t-shirt at center?" }, { "from": "gpt", "value": "A distance of 25.40 meters exists between white matte backpack at center and white t-shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ba6fea9024982c0.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any matte black bow at center in the image." }, { "from": "gpt", "value": "[(0.337, 0.811)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/87c30651648c3234.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing your home office and need to place a new item on the closest drawer to you. Which drawer should you choose between the white matte drawer at upper center and the white matte drawer at upper right?" }, { "from": "gpt", "value": "The white matte drawer at upper center is closer to the viewer than the white matte drawer at upper right, so you should place the new item on the white matte drawer at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73ea0647842d800c.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.647, 0.644) or (0.199, 0.580)?" }, { "from": "gpt", "value": "Positioned behind is point (0.199, 0.580)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7cafc8fb80cb402c.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to adjust the lighting for a photo shoot. You have a spotlight that can cover an area of 10 inches in diameter. There are two key elements in the scene you need to illuminate properly for the photo. The neon green wig at center and the black dotted fabric dress at center. Can the spotlight illuminate both elements at the same time without moving it?" }, { "from": "gpt", "value": "The distance between the neon green wig at center and the black dotted fabric dress at center is 9.66 inches. Since the spotlight can cover 10 inches in diameter, it can illuminate both elements simultaneously without needing to move it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a4e89fee4f85de1.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.338, 0.613) or point (0.679, 0.556)?" }, { "from": "gpt", "value": "Positioned behind is point (0.338, 0.613)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c91057646bcd599f.jpg", "conversations": [ { "from": "human", "value": "\nPoint to blue printed swimsuit at center.Point to the blue printed swimsuit at center in the image." }, { "from": "gpt", "value": "[(0.319, 0.733)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8288d0d515202e33.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.203, 0.845) and point (0.681, 0.977), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.203, 0.845) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1eadd4f10b955ea6.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of smooth white shirt at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.770, 0.366)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c3300780aaa74f45.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the denim jacket at lower left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.019, 0.780)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e7e6a45c2734105b.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of yellow glass traffic light at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.510, 0.791)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5fc5fe1d22e66598.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.943, 0.227) in front of point (0.447, 0.089)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/959ad482102c39f0.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.916, 0.359) and point (0.719, 0.530), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.719, 0.530) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9f8915a6e6f4e2a.jpg", "conversations": [ { "from": "human", "value": "\nYou are an attendee at this presentation and need to place your brown fabric purse at lower right on the floor next to the green fabric uniform at left. Will the purse fit vertically without overlapping the uniform?" }, { "from": "gpt", "value": "The brown fabric purse at lower right is not as tall as the green fabric uniform at left, so it can be placed vertically next to the uniform without overlapping." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ac55b6d8fc3107f6.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the white matte cabinet at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.400, 0.694)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/40f28e4c3efbcbb0.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of matte brown guitar at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.091, 0.466)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/76e244fe4ef9a2e6.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the viewpoint overlooking the city and want to know the distance between you and the brown textured rooftops at center. Can you estimate how far you are from them?" }, { "from": "gpt", "value": "The brown textured rooftops at center are 451.65 feet away from the viewer, so you are approximately 451.65 feet away from them." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aec7542974762bcf.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.245, 0.163) and point (0.457, 0.780), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.457, 0.780)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/90635edda1c29c4f.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the white matte building at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.565, 0.580)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3090cf6f3c53b7b2.jpg", "conversations": [ { "from": "human", "value": "\nYou are a coach standing at the sideline of the football field. You want to ensure that the green grass at center and the white matte jersey at center are positioned correctly for a play. What is the distance between them?" }, { "from": "gpt", "value": "The distance between the green grass at center and the white matte jersey at center is 10.72 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c6162459de9614c.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing a photo shoot and need to ensure that the black cotton shirt at center and the green leather jacket at right are visible in the frame. Given that the camera has a zoom lens that can adjust focus, which clothing item might require closer attention to ensure clarity due to its size?" }, { "from": "gpt", "value": "The black cotton shirt at center has a larger size compared to the green leather jacket at right, so it might require closer attention to ensure clarity due to its larger size." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f851e4d27a828810.jpg", "conversations": [ { "from": "human", "value": "\nDoes black satin dress at center appear on the right side of matte black dress at center?" }, { "from": "gpt", "value": "Indeed, black satin dress at center is positioned on the right side of matte black dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07966c477ae78147.jpg", "conversations": [ { "from": "human", "value": "\nLocate all satin white sedan at center in the image." }, { "from": "gpt", "value": "[(0.369, 0.580)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/98618ca27d791c6f.jpg", "conversations": [ { "from": "human", "value": "\nIs matte blue dress at center positioned in front of matte blue sailor dress at center?" }, { "from": "gpt", "value": "Yes, matte blue dress at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/61c7986ef175b6dd.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of glossy plastic bird feeder at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.548, 0.419)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b95d0984f668b111.jpg", "conversations": [ { "from": "human", "value": "\nLocate all satin blue suit at left in the image." }, { "from": "gpt", "value": "[(0.200, 0.675)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a399f26e643c47c7.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of point (0.429, 0.684)?" }, { "from": "gpt", "value": "7.30 feet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/080dd3e32740bf23.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.639, 0.639)?" }, { "from": "gpt", "value": "satin metallic suv at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6ca852a30a485f5.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between point (0.784, 0.380) and camera?" }, { "from": "gpt", "value": "A distance of 13.37 meters exists between point (0.784, 0.380) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/84337c672d511041.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.653, 0.887) farther from camera compared to point (0.990, 0.939)?" }, { "from": "gpt", "value": "Yes, point (0.653, 0.887) is behind point (0.990, 0.939)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6015ce08e5b94338.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the metallic reflective letter w at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.498, 0.409)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ff7fa1db1cad57b.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between white matte shirt at center and camera." }, { "from": "gpt", "value": "They are 35.72 inches apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/201e9a5331e232ec.jpg", "conversations": [ { "from": "human", "value": "\nBetween multicolored leotard at upper left and white matte shirt at upper right, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "white matte shirt at upper right is more to the right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c2a7bf3dd2c591e.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the festive float and want to take a photo of the point at coordinates point (0.209, 0.259). Based on its distance from you, would you need to zoom in or out to frame it properly?" }, { "from": "gpt", "value": "The point (0.209, 0.259) is 13.95 feet away from the viewer. To frame it properly, you would need to zoom out to capture the entire float and the point at that distance." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e83b2575f129fbc7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray fabric shirt at center is shorter than graywoollybeard at right?" }, { "from": "gpt", "value": "In fact, gray fabric shirt at center may be taller than graywoollybeard at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/563ac0a1381875a0.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point labeled point (0.207, 0.780) and want to walk to the point labeled point (0.867, 0.752). Given that both points are on the same riverbank, which direction should you face to move towards your destination?" }, { "from": "gpt", "value": "You should face towards the upper part of the river because point (0.867, 0.752) is further away from the camera compared to point (0.207, 0.780), so moving towards it would require heading in the direction away from the camera, which corresponds to the upper part of the river in this perspective." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/27981aa10061f2e7.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person trying to read the text on the yellow matte signboard at center and the dark brown hair at lower center. Which object is closer to you?" }, { "from": "gpt", "value": "The yellow matte signboard at center is closer to you because it is in front of the dark brown hair at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a1e83f89abae1d45.jpg", "conversations": [ { "from": "human", "value": "\nHow far apart are red metal fence at right and yellow paper sign at right?" }, { "from": "gpt", "value": "They are 29.76 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36dca906e4e7d62a.jpg", "conversations": [ { "from": "human", "value": "\nBetween brown leather hat at center and denim jacket at lower left, which one has more height?" }, { "from": "gpt", "value": "Standing taller between the two is brown leather hat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/69cec73ddb3ba7e8.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any green grassy hillside at lower center in the image." }, { "from": "gpt", "value": "[(0.343, 0.655)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/231da4f4cfef91de.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.884, 0.645) or point (0.513, 0.606)?" }, { "from": "gpt", "value": "Positioned behind is point (0.513, 0.606)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d4e3b1f2f80fba7f.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of green matte shirt at center?" }, { "from": "gpt", "value": "A distance of 3.58 meters exists between green matte shirt at center and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2caa537bf0361234.jpg", "conversations": [ { "from": "human", "value": "\nYou are a farmer who needs to separate the black fuzzy alpaca at center from the light beige woolen camel at upper left. What is the minimum distance you need to move one of them to ensure they are at least 5 feet apart?" }, { "from": "gpt", "value": "The current distance between the black fuzzy alpaca at center and the light beige woolen camel at upper left is 4.45 feet. To achieve a minimum of 5 feet apart, you need to move one of them by at least 0.55 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/80116e68f62d8d96.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.493, 0.778) from camera?" }, { "from": "gpt", "value": "Point (0.493, 0.778) is 24.88 inches away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/395de8f671b23f7d.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between black satin tuxedo at center and camera." }, { "from": "gpt", "value": "They are 5.72 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/30a6fbee14858886.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte white shirt at center have a lesser width compared to shiny black car at upper right?" }, { "from": "gpt", "value": "Correct, matte white shirt at center's width is less than shiny black car at upper right's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85c46342fe621927.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the green rough bark tree at left. Based on its position in the scene, can you determine if it is closer to you or further away compared to the other elements in the background?" }, { "from": "gpt", "value": "The green rough bark tree at left is located at point (0.079, 0.773), which places it closer to the foreground compared to the background elements, so it is closer to you." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/56676d2b32e0c8ea.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of weathered wood barn at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.438, 0.536)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/167f857b1498dc11.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black glasses at upper left to the right of black plastic glasses at left from the viewer's perspective?" }, { "from": "gpt", "value": "In fact, matte black glasses at upper left is to the left of black plastic glasses at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb6594c34189c9ad.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if glossy plastic traffic cone at center is thinner than metallic green traffic sign at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/945414f1576baf09.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the pink woolen gloves at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.528, 0.658)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/735f2a2a3567d6c5.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of white glossy electric guitar at center right from camera?" }, { "from": "gpt", "value": "white glossy electric guitar at center right and camera are 10.30 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/75dd8dc8f53e7dca.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the yellow corduroy sweater at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.415, 0.586)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a61baef7a1b5787a.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to light blue fabric shirt at center? Please provide its 2D coordinates.Where can I find light blue fabric shirt at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.062, 0.625)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/56d82cb62cd9e2d3.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the orange matte table at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.223, 0.914)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e01b1863d3495702.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue metallic license plate at center is bigger than denim jacket at lower right?" }, { "from": "gpt", "value": "No, blue metallic license plate at center is not bigger than denim jacket at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/13a2fbba3e86c340.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the matte ceramic mug at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.321, 0.658)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/54ffedfb07675781.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.683, 0.478) and camera." }, { "from": "gpt", "value": "The distance of point (0.683, 0.478) from camera is 4.81 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7fbf685a80431679.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the gray cotton shirt at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.452, 0.530)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/98b539bec4082798.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.440, 0.537)?" }, { "from": "gpt", "value": "stone castle at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/19e041bc0fe1bda2.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gold metallic twenty pence at center is bigger than silver/golden metallic five pence at center?" }, { "from": "gpt", "value": "Indeed, gold metallic twenty pence at center has a larger size compared to silver/golden metallic five pence at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc5b942fe201a3e3.jpg", "conversations": [ { "from": "human", "value": "\nDoes striped fabric shirt at center have a greater width compared to black plastic speaker at upper left?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0fee37f3137e4978.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the green leafy trees at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.745, 0.425)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df36e65d013bfbd6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if light brown hair at center is positioned above green grass train track at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/71d6219c2185d4c9.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.646, 0.359) or (0.694, 0.588)?" }, { "from": "gpt", "value": "Point (0.646, 0.359) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7d8ab27b2a56f4d.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.170, 0.619) positioned behind point (0.866, 0.430)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/21a69526532ff35b.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the matte red shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.657, 0.550)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b6b9a8ce25cfdad5.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray rocky mountain at upper center come in front of blue glossy motorcycle at center?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d45a2c5394c60177.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, dark brown leather jacket at right or matte black sweater at center?" }, { "from": "gpt", "value": "matte black sweater at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c5afae3c775df05.jpg", "conversations": [ { "from": "human", "value": "\nDoes white smooth fish at center appear under smooth black rod at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6da81d580f8da0ff.jpg", "conversations": [ { "from": "human", "value": "\nYou are a construction worker standing at the edge of the construction site. You need to locate the yellow metallic excavator at center. According to the coordinates provided, where exactly is it located?" }, { "from": "gpt", "value": "The yellow metallic excavator at center is located at coordinates point (0.728, 0.406)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a44a8fee57852821.jpg", "conversations": [ { "from": "human", "value": "\nPoint to brown dirt track at center.Point to the brown dirt track at center in the image." }, { "from": "gpt", "value": "[(0.438, 0.800)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f70c133bb09651d.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass at center shorter than white matte cricket bat at right?" }, { "from": "gpt", "value": "Indeed, green grass at center has a lesser height compared to white matte cricket bat at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00da4daeb67656b8.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of plaid fabric at center in the image." }, { "from": "gpt", "value": "[(0.687, 0.912)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/76185fb093a525b1.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.232, 0.336) or point (0.706, 0.939)?" }, { "from": "gpt", "value": "Positioned in front is point (0.706, 0.939)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/59126bf2f5c3064e.jpg", "conversations": [ { "from": "human", "value": "\nLocate matte plastic mirror at center in the image." }, { "from": "gpt", "value": "[(0.530, 0.533)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/936951de7b9a5f8d.jpg", "conversations": [ { "from": "human", "value": "\nBetween gray woolen suit at center and brown wooden table at center, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "From the viewer's perspective, brown wooden table at center appears more on the right side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de1f9ddfb530e08d.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the dark brown fabric pants at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.470, 0.777)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9635995d2cbf0227.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.049, 0.642) and camera?" }, { "from": "gpt", "value": "1.16 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b6be74877e978ecc.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.627, 0.463) or (0.469, 0.678)?" }, { "from": "gpt", "value": "Point (0.469, 0.678) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe12e73037002707.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth concrete stairs at center closer to the viewer compared to purple floral swimsuit at right?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cb71f4418bbefd7b.jpg", "conversations": [ { "from": "human", "value": "\nBetween matte black dress at center and striped fabric dress at center, which one is positioned lower?" }, { "from": "gpt", "value": "Positioned lower is matte black dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc7522bdd5f98ba2.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.456, 0.191) come farther from viewer compared to point (0.400, 0.408)?" }, { "from": "gpt", "value": "Yes, point (0.456, 0.191) is farther from viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aa2da77fa04f4771.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the gymnasium entrance. You want to take a photo of the blue jersey at center and the white cotton shirt at center. Which of the two will appear wider in the photo?" }, { "from": "gpt", "value": "The blue jersey at center will appear wider in the photo because its width surpasses that of the white cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cefd1bfe67028a37.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.899, 0.662) in front of point (0.646, 0.278)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7bca6a77bae68dc2.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the dark blue fabric cap at lower left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.132, 0.972)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4973565ef4809b7.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the green leafy tree at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.844, 0.181)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f886d8f46c7f470c.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.042, 0.473) farther from viewer compared to point (0.764, 0.047)?" }, { "from": "gpt", "value": "No, (0.042, 0.473) is in front of (0.764, 0.047)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fd0faa5e2fe231f1.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth red train at right bigger than smooth concrete path at center?" }, { "from": "gpt", "value": "Incorrect, smooth red train at right is not larger than smooth concrete path at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db3afd84b55995e8.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white lace dress at center is positioned below orange velvet robe at left?" }, { "from": "gpt", "value": "Incorrect, white lace dress at center is not positioned below orange velvet robe at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1d78ba8087a685a.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, blue plastic toy at center or purple fabric shirt at upper left?" }, { "from": "gpt", "value": "blue plastic toy at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2a2932633f7dd66b.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the green matte tree at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.198, 0.744)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf110b7f109a18f9.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a natural wood table at center. Pinpoint a point to the natural wood table at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.571, 0.531)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db039419de4503ae.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.972, 0.492) more distant than point (0.545, 0.456)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/94a212b3770c96c8.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.604, 0.706) and point (0.710, 0.550), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.710, 0.550)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d5b3ce992b1e0246.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.881, 0.200)?" }, { "from": "gpt", "value": "brown velvet elk at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c54e9eaddd271f1.jpg", "conversations": [ { "from": "human", "value": "\nYou are an architect reviewing the construction site. You notice the concrete at center and the metallic scaffolding at center. Which of these two elements has a larger size according to the description?" }, { "from": "gpt", "value": "The metallic scaffolding at center is larger than the concrete at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6bcca9a7ec9a9692.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between black fabric jacket at left and camera." }, { "from": "gpt", "value": "black fabric jacket at left and camera are 4.99 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04cb8c468258968c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if silver metallic minivan at lower right is positioned to the left of metallic blue car at lower right?" }, { "from": "gpt", "value": "In fact, silver metallic minivan at lower right is to the right of metallic blue car at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2df72904a60b1fcd.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the matte black suit at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.292, 0.623)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f0b74f458b71e9ca.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a closeup of the matte pink coat at lower center. Based on the coordinates provided, which direction should you move your camera to focus on it?" }, { "from": "gpt", "value": "The matte pink coat at lower center is located at coordinates point (0.388, 0.762). To focus on it, move the camera towards the lower center direction." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/10d82a2fcd9faee1.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green fabric cap at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.623, 0.808)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cdf4f4eff77b9db4.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between rainbow striped socks at lower left and camera." }, { "from": "gpt", "value": "rainbow striped socks at lower left is 21.58 inches away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec91adf0fedf26d2.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the white wood door at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.308, 0.541)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cb11dc80a3eccee0.jpg", "conversations": [ { "from": "human", "value": "\nHow close is matte black dress at center from smooth black coat at left?" }, { "from": "gpt", "value": "The distance of matte black dress at center from smooth black coat at left is 8.44 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ce242d4e60a6454.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, light blue fabric uniform at right or white uniform at center, stands taller?" }, { "from": "gpt", "value": "Standing taller between the two is light blue fabric uniform at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff48e24c5915fec7.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black suit at center thinner than brown suede pillow at upper left?" }, { "from": "gpt", "value": "Incorrect, matte black suit at center's width is not less than brown suede pillow at upper left's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d9bc27475c4ac8a.jpg", "conversations": [ { "from": "human", "value": "\nPoint to green leafy tree at center.Point to the green leafy tree at center in the image." }, { "from": "gpt", "value": "[(0.642, 0.364)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58f6025c111bd3a4.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance measurement between green leafy coconut tree at right and clear blue water at lower left?" }, { "from": "gpt", "value": "green leafy coconut tree at right is 5.42 meters away from clear blue water at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5805798037abba13.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a closeup shot of the white striped shirt at center and the yellow fabric at upper right. The camera you are using has a maximum focus range of 6 inches. Can you fit both objects within the camera frame without moving the camera?" }, { "from": "gpt", "value": "The white striped shirt at center and yellow fabric at upper right are 6.05 inches apart from each other, which is slightly more than the camera maximum focus range of 6 inches. Therefore, you cannot fit both objects within the camera frame without moving the camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dfb14c658f764e14.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the floral fabric skirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.508, 0.448)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ceaa3c2ce2c35b4d.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.271, 0.713)?" }, { "from": "gpt", "value": "purple fabric backpack at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b7a332c8830cf88.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.108, 0.139) come behind point (0.792, 0.695)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/653c4b5a307e2b26.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of silver metallic suv at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.403, 0.778)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5ac67c58afa8688f.jpg", "conversations": [ { "from": "human", "value": "\nYou are a tourist standing at the edge of the dark blue water at lower left, looking towards the white stone castle at center. Which direction should you head to reach the castle?" }, { "from": "gpt", "value": "The white stone castle at center is to the right of dark blue water at lower left, so you should head to the right to reach the castle." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c995e8174d49658f.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between point (0.669, 0.520) and camera." }, { "from": "gpt", "value": "Point (0.669, 0.520) and camera are 26.34 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3cf2fcf8add0c30a.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of green leafy tree at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.688, 0.314)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f59696335274d059.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the gray woolen hat at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.872, 0.850)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e9aa181a46318609.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from bare branches at center to camera." }, { "from": "gpt", "value": "bare branches at center is 47.90 feet from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8bf6cd64d3690687.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.430, 0.589) positioned in front of point (0.798, 0.806)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0436269e58f53cb7.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between point (0.028, 0.548) and camera?" }, { "from": "gpt", "value": "The distance of point (0.028, 0.548) from camera is 9.25 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f41a5c518ccdf2a.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the yellow matte life vest at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.310, 0.708)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/63de2a1476c51c2e.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person who needs to park your motorcycle exactly 60 feet away from the brown wooden pole at left. Given that your motorcycle is currently at the shiny chrome motorcycle at center, can you park it in the current spot?" }, { "from": "gpt", "value": "The distance between brown wooden pole at left and shiny chrome motorcycle at center is 62.04 feet. Since 62.04 feet is more than 60 feet, you cannot park the motorcycle at the current spot as it exceeds the required distance." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6cb6d6c562f23f15.jpg", "conversations": [ { "from": "human", "value": "\nLocate the white matte shirt at upper right in the image." }, { "from": "gpt", "value": "[(0.932, 0.580)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aae89aa4b3a23a74.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.372, 0.370) and camera?" }, { "from": "gpt", "value": "A distance of 146.99 meters exists between point (0.372, 0.370) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a84221ed78f81ac5.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white lace scarf at center is wider than beige lace scarf at center?" }, { "from": "gpt", "value": "Yes, white lace scarf at center is wider than beige lace scarf at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c80373883a7d501e.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of denim jacket at left less distant than that of black matte shirt at upper center?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba72374bc61cd693.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the white textured coat at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.768, 0.600)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3e316e052a2b54c1.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.469, 0.581) positioned before point (0.210, 0.180)?" }, { "from": "gpt", "value": "No, it is behind (0.210, 0.180)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92649fb260a788f9.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.352, 0.148) or (0.692, 0.853)?" }, { "from": "gpt", "value": "The point (0.352, 0.148) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f884eee91545c08.jpg", "conversations": [ { "from": "human", "value": "\nDoes white satin dress at center come behind matte black suit at center?" }, { "from": "gpt", "value": "No, it is in front of matte black suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1f568607d7574c2.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.448, 0.553) in front of point (0.877, 0.887)?" }, { "from": "gpt", "value": "No, (0.448, 0.553) is behind (0.877, 0.887)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36d05835ae92500e.jpg", "conversations": [ { "from": "human", "value": "\nIs matte white cake at left taller than black glossy/blackberry at center?" }, { "from": "gpt", "value": "Correct, matte white cake at left is much taller as black glossy/blackberry at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/139fdf532b55c393.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer planning to capture the white smooth church at center and the bare wood tree at left in a single shot. Given that your camera has a maximum focal length of 50 meters, will you be able to include both subjects in your photograph?" }, { "from": "gpt", "value": "The white smooth church at center is 26.21 meters from the bare wood tree at left. Since the distance between them is within the camera maximum focal length of 50 meters, you can include both subjects in a single shot." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1636636df350e006.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at point (0.821, 0.633) in the scene. How far are you from the camera?" }, { "from": "gpt", "value": "The point (0.821, 0.633) is 1.49 meters away from the camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/19505908c9bc6eae.jpg", "conversations": [ { "from": "human", "value": "\nCould you provide the distance between black matte figure at center and matte black jacket at center?" }, { "from": "gpt", "value": "black matte figure at center and matte black jacket at center are 33.10 inches apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00a966a52072eaf0.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of light brown leather jacket at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.361, 0.842)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c8534976c58c6a5d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if velvet black coat at center is taller than black satin bow tie at center?" }, { "from": "gpt", "value": "Correct, velvet black coat at center is much taller as black satin bow tie at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a49b73da541dbf50.jpg", "conversations": [ { "from": "human", "value": "\nBetween gray soft baby at center and blue rubber duck at upper center, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "From the viewer's perspective, gray soft baby at center appears more on the right side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7132d726bf2cb07.jpg", "conversations": [ { "from": "human", "value": "\nDoes smooth metal sign at center have a greater width compared to shiny black sedan at center?" }, { "from": "gpt", "value": "Correct, the width of smooth metal sign at center exceeds that of shiny black sedan at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b926d48db2f105ba.jpg", "conversations": [ { "from": "human", "value": "\nYou are a referee in the gymnasium observing the indoor tchoukball game. You notice two players wearing the black matte jersey at center and the light blue jersey at center. Based on their jersey positions, which player do you think is closer to the basketball hoop mounted on the wooden wall in the background?" }, { "from": "gpt", "value": "The black matte jersey at center is much taller than the light blue jersey at center, so the player wearing the black matte jersey at center is closer to the basketball hoop mounted on the wooden wall in the background." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b1be81a7160ea93.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, light blue shirt at center or green plastic pots at center?" }, { "from": "gpt", "value": "green plastic pots at center is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4b2a45c96d7b1109.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the origin point in the image. Which of the two points, point (0.934, 0.577) or point (0.459, 0.333), is closer to you?" }, { "from": "gpt", "value": "Point (0.934, 0.577) is closer to you because it is in front of point (0.459, 0.333)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e86e28029f87e5a.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.142, 0.670) positioned in front of point (0.376, 0.450)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c867414174aa56ac.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of point (0.354, 0.494)?" }, { "from": "gpt", "value": "Point (0.354, 0.494) is 562.73 feet from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f9fd29db36e0356f.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth concrete path at center to the right of concrete pillar at center from the viewer's perspective?" }, { "from": "gpt", "value": "Indeed, smooth concrete path at center is positioned on the right side of concrete pillar at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/187371137dcaae05.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the base of the green leafy tree at lower left. You want to walk to the entrance of the modern glass building. The entrance is located at the base of the spire. Can you estimate how far you need to walk to reach the entrance?" }, { "from": "gpt", "value": "The distance between the green leafy tree at lower left and the viewer is 213.18 feet. Since the entrance is at the base of the spire, which is part of the building, you would need to walk approximately 213.18 feet from the tree to reach the entrance." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c08d4cf7e414dc55.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, dark brown jacket at center or floral fabric dress at upper left?" }, { "from": "gpt", "value": "Positioned to the right is dark brown jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2db57efec1c5d134.jpg", "conversations": [ { "from": "human", "value": "\nWhat is at (0.887, 0.373)?" }, { "from": "gpt", "value": "white matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f0fd0c26bc799f92.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown leather jacket at upper left have a lesser width compared to green marble table at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b9639318d076e5b.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer who needs to place a small microphone stand exactly at the center of the room. The room has a white paper at center. Where should you place the microphone stand?" }, { "from": "gpt", "value": "The white paper at center is located at point (0.339, 0.480), so you should place the microphone stand at that coordinate." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34e523c7a574291e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black suit at center is positioned above teal fabric hand at center?" }, { "from": "gpt", "value": "Correct, matte black suit at center is located above teal fabric hand at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ee5ef42989d3eaae.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte gray tank top at center is smaller than wooden column at center?" }, { "from": "gpt", "value": "Actually, matte gray tank top at center might be larger than wooden column at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c467493a171d1656.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person who needs to enter the cabin through the open door. There is a black rubber wheelchair at lower center and a camouflage fabric shirt at center in the way. Can you walk through the space between them?" }, { "from": "gpt", "value": "The black rubber wheelchair at lower center is larger in size than camouflage fabric shirt at center, so the space between them may be sufficient for you to walk through. However, since the wheelchair is larger, you should check the actual distance before proceeding to ensure safety." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f49126dd3a413da.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.623, 0.350) positioned before point (0.781, 0.672)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6a4a22f26cc82c45.jpg", "conversations": [ { "from": "human", "value": "\nBetween metallic honeycomb structure at center and matte gray concrete bench at center, which one has more height?" }, { "from": "gpt", "value": "metallic honeycomb structure at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7f7aedfb06c62c19.jpg", "conversations": [ { "from": "human", "value": "\nYou are a spectator at the ski jump event. You see the white glossy skis at lower center and the yellow fabric jacket at right. Which object is located to the left of the other?" }, { "from": "gpt", "value": "The white glossy skis at lower center are positioned on the left side of the yellow fabric jacket at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd9d3db1aeb767bc.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer adjusting your camera to focus on the blonde hair at center and the dark blue knitted blanket at center. Which object should you focus on first to ensure the closest object is sharp?" }, { "from": "gpt", "value": "You should focus on the blonde hair at center first because it is closer to the viewer than the dark blue knitted blanket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7c6f246ae5ce7780.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.900, 0.877) or (0.785, 0.625)?" }, { "from": "gpt", "value": "Positioned in front is point (0.785, 0.625)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/440376def6d52eef.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, matte green cushion at right or green fabric bag at center?" }, { "from": "gpt", "value": "With less height is matte green cushion at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fcf4c3b43f7664fb.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery driver who needs to reach the metallic red car at lower left parked near the bushes. You are currently on the black asphalt road at lower right. Can you drive directly to the car without leaving the road?" }, { "from": "gpt", "value": "The distance between the black asphalt road at lower right and metallic red car at lower left is 104.18 feet, so yes, you can drive directly to the metallic red car at lower left along the road since the road connects them." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d363fdf2900d8c44.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the dark wooden shelf unit and want to take a photo of the floral porcelain plate at center. If your camera is 5.84 feet away from the plate, will it fit into the frame?" }, { "from": "gpt", "value": "The floral porcelain plate at center and camera are 5.84 feet apart, which means the camera is positioned exactly at the required distance to capture the plate within the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c8b472a9347dfd6e.jpg", "conversations": [ { "from": "human", "value": "\nDoes white stone column at left have a greater width compared to white carved column at center?" }, { "from": "gpt", "value": "Correct, the width of white stone column at left exceeds that of white carved column at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d684f31fa6719b6.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the white cotton shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.571, 0.453)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a1ddb7c015a307e4.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.109, 0.344) or (0.269, 0.673)?" }, { "from": "gpt", "value": "Point (0.109, 0.344) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2e02021f7d1c210.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to matte gray suit at center? Please provide its 2D coordinates.Where can I find matte gray suit at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.704, 0.588)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3121091be9366fff.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a gray asphalt road at lower center. Pinpoint a point to the gray asphalt road at lower center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.588, 0.927)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a9ef8c84fbe9b29.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.325, 0.436) or (0.282, 0.359)?" }, { "from": "gpt", "value": "Point (0.325, 0.436) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2990ed2d5b16bbf2.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person needing to park your motorcycle on the street. The image shows a metallic teal motorcycle at center and a gray concrete curb at lower left. Is the motorcycle currently parked on the curb?" }, { "from": "gpt", "value": "The metallic teal motorcycle at center is positioned over gray concrete curb at lower left, so yes, the motorcycle is parked on the curb." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5ab9a90535e125e5.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a smooth strawberry ice cream at upper right. Pinpoint a point to the smooth strawberry ice cream at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.821, 0.423)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a1b2a747973ea629.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the floral fabric dress at left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.043, 0.673)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82d293a7200861e2.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.730, 0.639) or point (0.087, 0.739)?" }, { "from": "gpt", "value": "Point (0.730, 0.639)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1cceab5689d58737.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between point (0.509, 0.664) and camera?" }, { "from": "gpt", "value": "Point (0.509, 0.664) is 23.47 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/68e9474ae2bddc0d.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of charred wood pile at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.387, 0.578)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a9cb5fde5ca025b4.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in a forest and want to reach a specific point marked at coordinates point (0.463, 0.622). How far is this point from you?" }, { "from": "gpt", "value": "The point (0.463, 0.622) is 70.47 meters away from the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2651b65d24147fb6.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the weathered wood log at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.509, 0.487)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23ad3291c42a099a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if knitted wool hat at left is bigger than black matte goggles at center?" }, { "from": "gpt", "value": "Indeed, knitted wool hat at left has a larger size compared to black matte goggles at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9336be99382d0aa7.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the green matte t-shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.718, 0.467)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d949d9f68e11e6a0.jpg", "conversations": [ { "from": "human", "value": "\nYou are a customer entering the store and see the metallic sign at upper left and the black plastic number at upper left. Which one is wider?" }, { "from": "gpt", "value": "The metallic sign at upper left is wider than the black plastic number at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/978cf4dd03892ee2.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker who has just arrived at the forest clearing. You see the green water at center and the brown rough tree at left. Which object is positioned to the right of the other?" }, { "from": "gpt", "value": "The green water at center is positioned to the right of the brown rough tree at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6defba526c0c5242.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.172, 0.867) from camera?" }, { "from": "gpt", "value": "A distance of 2.34 meters exists between point (0.172, 0.867) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3918230305ff1cd8.jpg", "conversations": [ { "from": "human", "value": "\nYou are a gardener who needs to water the green matte plant at center. The black plastic tray at center is currently empty. Where should you pour water to ensure the plant gets enough moisture without overwatering?" }, { "from": "gpt", "value": "You should pour water directly onto the soil around the green matte plant at center. Since the black plastic tray at center is larger, it can collect excess water, preventing overwatering while allowing the plant to absorb what it needs." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01912a95b2533bf1.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, transparent glass wine glass at lower center or translucent glass wine at center?" }, { "from": "gpt", "value": "From the viewer's perspective, transparent glass wine glass at lower center appears more on the right side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0437e6ed1b7767a3.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of blue painted metal train at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.210, 0.331)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a0bb919df99d034.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at lower left is positioned above green leafy tree at center?" }, { "from": "gpt", "value": "No, green leafy tree at lower left is not above green leafy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd78f1a5db0be10b.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the gray cotton t-shirt at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.799, 0.845)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b1947ef07d7848b.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance measurement between light brown rough wood at center and gray rough rock at center?" }, { "from": "gpt", "value": "They are 20.86 inches apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e326e74d2fb78eef.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.112, 0.686) come farther from viewer compared to point (0.465, 0.666)?" }, { "from": "gpt", "value": "No, it is in front of (0.465, 0.666)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5eecb69647edb707.jpg", "conversations": [ { "from": "human", "value": "\nIs green grassy field at lower center taller than green leafy tree at upper left?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f012472554cf304.jpg", "conversations": [ { "from": "human", "value": "\nPoint to gray heathered t-shirt at center.Point to the gray heathered t-shirt at center in the image." }, { "from": "gpt", "value": "[(0.544, 0.492)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e92fa3add56bf99c.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of black matte shirt at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.482, 0.670)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf73012e923012b8.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the clear water at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.349, 0.744)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/40ee2edaa4d6ac4a.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance from gray stone at center to white marble gravestone at center." }, { "from": "gpt", "value": "They are 17.64 inches apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e36203115143e0d6.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of white powdery snow at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.431, 0.897)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/afe0565086ab37d9.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.783, 0.794) or (0.829, 0.520)?" }, { "from": "gpt", "value": "Point (0.829, 0.520)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6148d1e446d69e25.jpg", "conversations": [ { "from": "human", "value": "\nLocate the matte red bus at center in the image." }, { "from": "gpt", "value": "[(0.713, 0.523)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b22d227b98ce6dce.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if clear water at center is smaller than smooth gray rock at center?" }, { "from": "gpt", "value": "No, clear water at center is not smaller than smooth gray rock at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db210932afac681b.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the distance between glossy black table at center and red plastic chair at center?" }, { "from": "gpt", "value": "glossy black table at center is 14.89 inches away from red plastic chair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e46795026b32f2b.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.500, 0.270)?" }, { "from": "gpt", "value": "smooth concrete buildings at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab5830ec037cf0b0.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.784, 0.512) or (0.133, 0.573)?" }, { "from": "gpt", "value": "Point (0.784, 0.512) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ad69326023b94fa.jpg", "conversations": [ { "from": "human", "value": "\nBetween clear water at center and brown sandy beach at lower center, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "brown sandy beach at lower center is more to the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3e78c9110d91425d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray sand at center is positioned below brown bark tree at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a00803504ed93954.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a brown woolen goat at center. Pinpoint a point to the brown woolen goat at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.399, 0.487)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7dd8f1f7459ce3bc.jpg", "conversations": [ { "from": "human", "value": "\nDoes white paper sign at upper center appear under green plastic street sign at upper center?" }, { "from": "gpt", "value": "Indeed, white paper sign at upper center is positioned under green plastic street sign at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aa33dc473d4fc662.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.683, 0.141) closer to viewer compared to point (0.160, 0.680)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/11ecc42d6ed4d4f6.jpg", "conversations": [ { "from": "human", "value": "\nHow far is clear water at beach center from camera?" }, { "from": "gpt", "value": "clear water at beach center is 16.11 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7507f337f864453c.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of dark grass at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.490, 0.834)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b152e3130c97b5b1.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the left, blue water at lower center or metallic gray ship at right?" }, { "from": "gpt", "value": "From the viewer's perspective, blue water at lower center appears more on the left side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9963827645de8d66.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at a point and want to reach the foreground pigeon standing near a discarded peanut shell. The coordinates of your current position are point (0.292, 0.661). How far do you need to walk to reach the pigeon?" }, { "from": "gpt", "value": "The distance between point (0.292, 0.661) and the foreground pigeon is 9.17 feet, so you need to walk 9.17 feet to reach the pigeon." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c1e64ab013d64eb6.jpg", "conversations": [ { "from": "human", "value": "\nIs orange metallic excavator at center in front of green fabric construction worker at center?" }, { "from": "gpt", "value": "Yes, it is in front of green fabric construction worker at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/80df85d5de4185e9.jpg", "conversations": [ { "from": "human", "value": "\nYou are a drone operator flying at an altitude of 1000 meters. You need to capture a clear photo of the green leafy forest at center. Is the drone within the required 700 meters distance to take the photo?" }, { "from": "gpt", "value": "The distance of green leafy forest at center from camera is 661.01 meters, which is within the 700 meters requirement. The drone can capture the photo clearly." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06ff4cd5af4b0b8c.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer planning to capture a landscape shot of the turquoise glossy water at center and green leafy trees at center. Based on their positions, which object will appear closer to the camera in the final photo?" }, { "from": "gpt", "value": "The turquoise glossy water at center will appear closer to the camera in the final photo because it is positioned in front of the green leafy trees at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d16a2cee8fcda163.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer positioned at the edge of the water. You want to capture a photo of the white matte camel at center and the green painted wood boat at lower left in the same frame. Which object should you position closer to the left side of your camera viewfinder to include both in the shot?" }, { "from": "gpt", "value": "The green painted wood boat at lower left is to the left of the white matte camel at center, so you should position the green painted wood boat at lower left closer to the left side of your camera viewfinder to include both in the shot." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e6675f10476abdf2.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.459, 0.433) lie behind point (0.672, 0.273)?" }, { "from": "gpt", "value": "No, (0.459, 0.433) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1bc31c11962ad778.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the dark brown hair at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.809, 0.628)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/646069d0303eda07.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of gray marble pillar at center in the image." }, { "from": "gpt", "value": "[(0.451, 0.336)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bdddf866b6d84bf0.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green plastic road sign at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.508, 0.581)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b6e27e88c3d8ba89.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a transparent plastic airplane window at upper center. Pinpoint a point to the transparent plastic airplane window at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.329, 0.150)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/11dcac7ff66f4c16.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the white-spotted fur at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.778, 0.516)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86a69746a156e019.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of black and white crochet at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.478, 0.872)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ad2b73c2f6e8a4c9.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if stainless steel refrigerator at right is positioned above silver metallic toaster at left?" }, { "from": "gpt", "value": "Incorrect, stainless steel refrigerator at right is not positioned above silver metallic toaster at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/71a2bfcf55938b0e.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person who just arrived at a furniture store. You need to place a new sofa that is 7 feet long into the space between the brown leather couch at left and the wooden table at center. Can you fit the new sofa there?" }, { "from": "gpt", "value": "The distance between the brown leather couch at left and the wooden table at center is 6.70 feet. Since the new sofa is 7 feet long, it will not fit in the available space as it is slightly longer than the distance between them." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4de991d2ca58e8f4.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if camouflage uniform at center is positioned above black matte suit at center?" }, { "from": "gpt", "value": "Yes, camouflage uniform at center is above black matte suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5e4f720a69c4253.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark gray asphalt driveway at lower center is shorter than white matte window at upper right?" }, { "from": "gpt", "value": "Correct, dark gray asphalt driveway at lower center is not as tall as white matte window at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/507fd1654a406b40.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.469, 0.508)?" }, { "from": "gpt", "value": "blue water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85ced914c199f266.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from dark gray sweater at left to camera." }, { "from": "gpt", "value": "96.55 centimeters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b315d663124bcea.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the green leafy plant at upper left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.044, 0.686)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b145ed7d3164783f.jpg", "conversations": [ { "from": "human", "value": "\nWhere is gray matte shirt at left located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.176, 0.662)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c93005b140d41653.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of polished black horse at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.359, 0.586)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/648762540a65fa34.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between matte pink dress at center and pink fabric dress at center." }, { "from": "gpt", "value": "9.93 inches" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00deb2e319774278.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.681, 0.798) or (0.657, 0.530)?" }, { "from": "gpt", "value": "Point (0.681, 0.798)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0024f95408673971.jpg", "conversations": [ { "from": "human", "value": "\nBetween linen green blazer at right and brown wooden picnic table at center, which one has more height?" }, { "from": "gpt", "value": "Standing taller between the two is linen green blazer at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bb8be7224914280b.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.696, 0.619) and point (0.943, 0.395), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.696, 0.619)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6221e48787951041.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the group photo at the formal event. There is a point marked at coordinates (0.508, 0.702). What object in the photo is located at this point?" }, { "from": "gpt", "value": "The point at (0.508, 0.702) corresponds to the white satin blazer at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2996f0434ec737d5.jpg", "conversations": [ { "from": "human", "value": "\nIs green wood ramp at lower center thinner than green wooden fence at lower right?" }, { "from": "gpt", "value": "Indeed, green wood ramp at lower center has a lesser width compared to green wooden fence at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8f136aa4b8f7745.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person who needs to drive the shiny blue truck at center under a low bridge. The yellow concrete curb at lower center is at the same height as the bridge. Will the truck fit under the bridge?" }, { "from": "gpt", "value": "The shiny blue truck at center is much taller than the yellow concrete curb at lower center, so it will not fit under the bridge which is at the same height as the curb." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f027e6ea7acf3a4c.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of blue fabric jacket at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.298, 0.575)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ffb2c702641cc30.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, brown gravel at center or smooth skin legs at center?" }, { "from": "gpt", "value": "Positioned lower is brown gravel at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8f5441187db6337d.jpg", "conversations": [ { "from": "human", "value": "\nHow close is gray concrete tarmac at center from dark blue uniform at center?" }, { "from": "gpt", "value": "gray concrete tarmac at center is 4.75 meters from dark blue uniform at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00baac6c1ac34c31.jpg", "conversations": [ { "from": "human", "value": "\nDescribe the object at (0.556, 0.611)." }, { "from": "gpt", "value": "dark gray sleeveless tank top at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/349cfb90bcf8ed28.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the green matte t-shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.621, 0.608)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a261c08781b14fd.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy trees at center come behind green leafy tree at upper right?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a8734a360869d4b.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of multicolored painted totem pole at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.342, 0.434)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/42d25e5e280488b0.jpg", "conversations": [ { "from": "human", "value": "\nHow close is jeans at center from camera?" }, { "from": "gpt", "value": "jeans at center is 3.51 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0642791b44bb3de5.jpg", "conversations": [ { "from": "human", "value": "\nYou are arranging flowers in the bedroom and need to place a bouquet that requires a stable, elevated surface. Which object between the velvet burgundy pillow at center and the blue glossy headboard at upper right would be more suitable for placing the bouquet?" }, { "from": "gpt", "value": "The blue glossy headboard at upper right is taller than the velvet burgundy pillow at center, making it a more suitable elevated surface for placing the bouquet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/62dbf7d047b4d7b5.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer planning to capture the white wood church at center and the shiny copper spire at upper center in a single frame. Which object will occupy more horizontal space in the photo?" }, { "from": "gpt", "value": "The white wood church at center will occupy more horizontal space in the photo since its width surpasses that of the shiny copper spire at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0bb7f848113ebdd5.jpg", "conversations": [ { "from": "human", "value": "\nLocate the blue fabric couch at center in the image." }, { "from": "gpt", "value": "[(0.809, 0.731)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b1faf9bf4b97108.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between green grass at center and camera?" }, { "from": "gpt", "value": "green grass at center and camera are 10.87 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc15301a7636a992.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.507, 0.591) lie behind point (0.466, 0.603)?" }, { "from": "gpt", "value": "No, (0.507, 0.591) is in front of (0.466, 0.603)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/347b0e345b932883.jpg", "conversations": [ { "from": "human", "value": "\nIs brown leather chair at left to the left of brown leather chair at center from the viewer's perspective?" }, { "from": "gpt", "value": "Yes, brown leather chair at left is to the left of brown leather chair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/254badcbc728715b.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of gray asphalt pavement at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.571, 0.820)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8ff0ba199f1a2780.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is black matte shirt at center from camera?" }, { "from": "gpt", "value": "3.44 feet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d57af9119aa31028.jpg", "conversations": [ { "from": "human", "value": "\nLocate blue water at center in the image." }, { "from": "gpt", "value": "[(0.444, 0.745)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/590b204667c37a93.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, wooden stairs at center or beige stone building at upper center, stands taller?" }, { "from": "gpt", "value": "beige stone building at upper center is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/875c702c98b2bf5e.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of green wood rocking chair at center right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.821, 0.430)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0bfec98d2f0a7fd7.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.780, 0.573) or (0.450, 0.539)?" }, { "from": "gpt", "value": "Positioned behind is point (0.450, 0.539)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2cffae6784e8440c.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.417, 0.564) or point (0.983, 0.664)?" }, { "from": "gpt", "value": "Positioned behind is point (0.417, 0.564)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be2d08cb4293d9e4.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of smooth skin torso at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.351, 0.609)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c8b5173b822eb254.jpg", "conversations": [ { "from": "human", "value": "\nDoes light blue checkered shirt at center have a greater height compared to dark blue sweater at center?" }, { "from": "gpt", "value": "In fact, light blue checkered shirt at center may be shorter than dark blue sweater at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/454067b262d5f5d8.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person trying to navigate through the street scene. You see two points marked on the ground at coordinates point (0.792, 0.586) and point (0.442, 0.653). Which point is closer to the sidewalk where the man is sitting?" }, { "from": "gpt", "value": "Point (0.792, 0.586) is in front of point (0.442, 0.653), so it is closer to the sidewalk where the man is sitting." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d736efdfd110bdc1.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the birthday party. You need to take a photo of the white matte plate at center without including the striped cotton shirt at lower left. Is the shirt currently in the frame of the plate?" }, { "from": "gpt", "value": "The striped cotton shirt at lower left is below the white matte plate at center, so it is in the frame of the plate. To exclude the shirt, adjust the camera angle upwards or move the shirt." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b17c6579f6c5e473.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.055, 0.084) and point (0.875, 0.211), which one is positioned in front?" }, { "from": "gpt", "value": "Positioned in front is point (0.875, 0.211)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6732b82c935445b9.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.290, 0.463) in front of point (0.253, 0.575)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/21a8fbf293834ec5.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any shiny brown leather sandals at center in the image." }, { "from": "gpt", "value": "[(0.413, 0.283)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3bbc4ccb34730206.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the lakeside and see the white glossy boat at left. If you want to walk to the boat, how far do you need to walk?" }, { "from": "gpt", "value": "The white glossy boat at left is 24.01 meters away from you, so you need to walk 24.01 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34e088cfe545294e.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of green matte shirt at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.721, 0.514)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ab52c836553c68e.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.326, 0.863) more distant than point (0.315, 0.997)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/89a0dfc6892080fc.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.995, 0.887) positioned in front of point (0.700, 0.484)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.700, 0.484)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/856e001cbf6b05bd.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of shiny black tiles at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.462, 0.255)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ae9cf1c9fb66e751.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.754, 0.070) farther from viewer compared to point (0.218, 0.605)?" }, { "from": "gpt", "value": "Yes, it is behind point (0.218, 0.605)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0df38f8db1cc07b.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of brown dirt track at lower left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.501, 0.848)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a48972ebceed45e5.jpg", "conversations": [ { "from": "human", "value": "\nDescribe the object at (0.521, 0.333)." }, { "from": "gpt", "value": "rubber balloons at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9895d0013de09416.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the living room and want to place a small decorative item exactly at the point marked as point (0.627, 0.911). If your arm reaches out 1.2 meters, can you comfortably place the item there without moving closer?" }, { "from": "gpt", "value": "The distance of point (0.627, 0.911) from viewer is 1.36 meters, so since your arm only reaches 1.2 meters, you would need to move closer to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f609d16c5de06f9.jpg", "conversations": [ { "from": "human", "value": "\nBetween matte red poster at left and blue cotton t-shirt at right, which one has less height?" }, { "from": "gpt", "value": "With less height is blue cotton t-shirt at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a873c6339ecb2156.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of white cotton shirt at left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.057, 0.381)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/54e76c7ed5805f14.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.565, 0.458)?" }, { "from": "gpt", "value": "brown stone sculpture at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/263ab5ebe91e5e87.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.858, 0.284) or (0.487, 0.553)?" }, { "from": "gpt", "value": "Positioned behind is point (0.858, 0.284)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/18bca6caec1bd17c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if rough stone ledge at center is positioned below white smooth shirt at center?" }, { "from": "gpt", "value": "Correct, rough stone ledge at center is located below white smooth shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2af8fa348426076.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.419, 0.927) closer to camera compared to point (0.552, 0.870)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a78f7742de5a9a49.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the base of the green leafy tree at center and want to throw a rock to hit a target 50 meters away. Will you be able to reach the target with one throw?" }, { "from": "gpt", "value": "The target is 50 meters away, and the maximum distance you can throw is 48.49 meters, so you cannot reach the target with one throw." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a680aeb938be7ce.jpg", "conversations": [ { "from": "human", "value": "\nYou are an artist who needs to place a protective cover over the shiny dark red armor at center and the shiny metallic dragon at center. Which object should you cover first to avoid blocking the view of the one above?" }, { "from": "gpt", "value": "You should cover the shiny metallic dragon at center first because the shiny dark red armor at center is below it, so covering the dragon first will prevent blocking the armor below." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b52329cc3a1c7c2.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.971, 0.630) come behind point (0.772, 0.680)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4e389684e46f940b.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue plastic bucket at lower right appear on the left side of light blue denim jacket at center?" }, { "from": "gpt", "value": "In fact, blue plastic bucket at lower right is to the right of light blue denim jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5f64d7a96e0eba2.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of clear glass window at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.934, 0.414)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/42157e2936df38db.jpg", "conversations": [ { "from": "human", "value": "\nLocate green leafy tree at center in the image." }, { "from": "gpt", "value": "[(0.478, 0.181)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c9c3dd0162d1e1c1.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.985, 0.375) or (0.089, 0.930)?" }, { "from": "gpt", "value": "Point (0.985, 0.375)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b16a5053b8a4eb5.jpg", "conversations": [ { "from": "human", "value": "\nYou are an art curator planning to display both the black polished cross at center and the polished bronze crucifix at center in a gallery. Given their sizes, which one would require more space for proper display?" }, { "from": "gpt", "value": "The black polished cross at center is bigger than the polished bronze crucifix at center, so it would require more space for proper display." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f4c488161803f599.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of green metallic fence at upper center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.742, 0.134)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3f7b527845a5132b.jpg", "conversations": [ { "from": "human", "value": "\nDoes smooth water at center lie in front of wooden boat at lower right?" }, { "from": "gpt", "value": "No, smooth water at center is behind wooden boat at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/99ef0f58638f8618.jpg", "conversations": [ { "from": "human", "value": "\nDoes orange t-shirt at center come in front of khaki cotton shorts at lower right?" }, { "from": "gpt", "value": "Yes, orange t-shirt at center is in front of khaki cotton shorts at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b236fb5b3032474.jpg", "conversations": [ { "from": "human", "value": "\nPoint to teal fabric boat at center.Point to the teal fabric boat at center in the image." }, { "from": "gpt", "value": "[(0.386, 0.944)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/efd768a4ccdafda7.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the smooth sandstone cliff at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.547, 0.256)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c444d2628caaa67d.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.734, 0.642) from camera?" }, { "from": "gpt", "value": "Point (0.734, 0.642) is 3.87 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58b07f86fb896378.jpg", "conversations": [ { "from": "human", "value": "\nIs clear water at center positioned before metallic gray crane at center right?" }, { "from": "gpt", "value": "Yes, clear water at center is in front of metallic gray crane at center right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/597f580dff99a44e.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the gold metallic convertible at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.482, 0.614)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d1b8e500a3f5dc7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black suit at center is thinner than white paper at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3cc97055271c3860.jpg", "conversations": [ { "from": "human", "value": "\nBetween metallic power line at upper center and green leafy tree at center, which one is positioned lower?" }, { "from": "gpt", "value": "green leafy tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df791fdc6f240819.jpg", "conversations": [ { "from": "human", "value": "\nDoes green mossy log at center have a larger size compared to green mossy tree at upper center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3ef808de80a77eae.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the wooden shoe rack at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.755, 0.658)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a6bd02ce3592d898.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the showroom and see two points marked on the floor. The first point is at point (0.284, 0.445) and the second point is at point (0.762, 0.377). Which point is closer to you?" }, { "from": "gpt", "value": "Point (0.284, 0.445) is in front of point (0.762, 0.377), so it is closer to you." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/94f096d21f7f7071.jpg", "conversations": [ { "from": "human", "value": "\nHow close is point (0.095, 0.809) from camera?" }, { "from": "gpt", "value": "Point (0.095, 0.809) is 5.34 feet from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/866cc4a36a268fb7.jpg", "conversations": [ { "from": "human", "value": "\nDoes greenish water at center appear on the left side of black wood paddle at center?" }, { "from": "gpt", "value": "Incorrect, greenish water at center is not on the left side of black wood paddle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/31bfd2e438fc124c.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.748, 0.542) or (0.953, 0.675)?" }, { "from": "gpt", "value": "The point (0.748, 0.542) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bfc7fde6d157cd4a.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between point (0.206, 0.637) and camera?" }, { "from": "gpt", "value": "They are 6.61 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/67046e4b155fdc4e.jpg", "conversations": [ { "from": "human", "value": "\nLocate all matte black monitor at left in the image." }, { "from": "gpt", "value": "[(0.271, 0.645)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4b895a6d3f742fd2.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a wooden stairs at center. Pinpoint a point to the wooden stairs at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.423, 0.786)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/014dc8d047641390.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.388, 0.795)?" }, { "from": "gpt", "value": "yellow asphalt highway at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/39d9fa55ec727328.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.147, 0.688) or (0.375, 0.838)?" }, { "from": "gpt", "value": "Point (0.147, 0.688)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/291d62e330caa6f3.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.334, 0.648) come behind point (0.414, 0.578)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d619147bb2beecc.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the beige stone building at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.488, 0.562)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3612148a27a105a4.jpg", "conversations": [ { "from": "human", "value": "\nDoes light blue cotton shirt at center have a smaller size compared to white matte shirt at right?" }, { "from": "gpt", "value": "No, light blue cotton shirt at center is not smaller than white matte shirt at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd879283f74f8033.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.583, 0.533) come in front of point (0.869, 0.222)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/94941cea2bd7ea3e.jpg", "conversations": [ { "from": "human", "value": "\nYou are a fashion designer observing the scene. You need to determine which clothing item has a greater width between the black matte shirt at center and the purple fleece hoodie at left. Based on the description, which one is wider?" }, { "from": "gpt", "value": "The black matte shirt at center is wider than the purple fleece hoodie at left according to the description." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1504943dc3ea1bb7.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the light gray shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.769, 0.750)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0253830f937ad9f0.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, brown cardboard box at right or white matte bottle at left?" }, { "from": "gpt", "value": "white matte bottle at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/270c2bd93a01cf26.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the blue cotton shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.571, 0.670)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b208c2fc04a6922c.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.836, 0.552) and camera?" }, { "from": "gpt", "value": "Point (0.836, 0.552) and camera are 3.50 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/294ac304c8cd8b8a.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, wooden at right or brown spotted giraffe at lower right, stands shorter?" }, { "from": "gpt", "value": "With less height is wooden at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3eabc31aa9612a87.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of point (0.692, 0.556)?" }, { "from": "gpt", "value": "Point (0.692, 0.556) and camera are 4.10 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2cae954f549b58b5.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the point marked as point (0.569, 0.341). You want to capture a photo of the soccer match. The camera you are using has a focal length of 50mm and a sensor size of 24mm. What is the distance between you and the camera to ensure the entire soccer field fits in the frame?" }, { "from": "gpt", "value": "The distance between the photographer at point (0.569, 0.341) and the camera is 9.85 meters. To ensure the entire soccer field fits in the frame, the photographer should maintain this distance of 9.85 meters from the camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc76f6282c8b60a4.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at upper center have a greater height compared to green polished dome at upper left?" }, { "from": "gpt", "value": "Correct, green leafy tree at upper center is much taller as green polished dome at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49e0b5e123ebaf0f.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the golden brown fur at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.712, 0.636)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ecf2e02fc112dce5.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of gray fluffy cat at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.774, 0.606)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f96fc3331d976fd.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.960, 0.886) or point (0.504, 0.531)?" }, { "from": "gpt", "value": "The point (0.504, 0.531) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0dd26d2bdea24739.jpg", "conversations": [ { "from": "human", "value": "\nHow far is smooth granite water at center from camera?" }, { "from": "gpt", "value": "smooth granite water at center and camera are 41.88 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b00461378a2d32d.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the bathroom and need to place a new item between the two points marked as point (0.492, 0.720) and point (0.300, 0.223). Which point should you place it closer to so that it remains in front of the other point?" }, { "from": "gpt", "value": "You should place the new item closer to point (0.492, 0.720) so that it remains in front of point (0.300, 0.223) since point (0.492, 0.720) is already in front of point (0.300, 0.223)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34ffe8979a268818.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.276, 0.619) come behind point (0.217, 0.600)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/310676b99601fd16.jpg", "conversations": [ { "from": "human", "value": "\nBetween smooth concrete sidewalk at lower center and gray uniform at center, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "smooth concrete sidewalk at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86ebf86107b3c06f.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to white vapor at center? Please provide its 2D coordinates.Where can I find white vapor at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.736, 0.356)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/849783bbd0217531.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer taking a picture of the stage. You notice the white matte chef hat at center and the shiny brown coat at center. Which object should you focus on first if you want to capture the taller one?" }, { "from": "gpt", "value": "You should focus on the shiny brown coat at center first because it is taller than the white matte chef hat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de6114ce05109277.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the dark blue fabric at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.414, 0.511)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d3d5cc2505ee3ae5.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.650, 0.811) and camera?" }, { "from": "gpt", "value": "A distance of 1.88 meters exists between point (0.650, 0.811) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04660dc77d47a4ca.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.815, 0.909) closer to viewer compared to point (0.537, 0.334)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e562863c147997c4.jpg", "conversations": [ { "from": "human", "value": "\nYou are an observer looking at the landscape. Which object, the dark gray cloud at upper center or the green matte tree at center, occupies a bigger area in the scene?" }, { "from": "gpt", "value": "The dark gray cloud at upper center has a larger size compared to the green matte tree at center, so it occupies a bigger area in the scene." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3fff573d9218a28c.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.202, 0.361) or (0.425, 0.980)?" }, { "from": "gpt", "value": "Positioned in front is point (0.202, 0.361)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc3380a5cff8e7b0.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the event and want to capture a photo that includes both the blue cotton shirt at center and the black fabric shirt at left. Considering their heights, which shirt will appear taller in the photo?" }, { "from": "gpt", "value": "The blue cotton shirt at center will appear taller in the photo since it has a greater height compared to the black fabric shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44eba81f97a08f8b.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.408, 0.591) and point (0.727, 0.347), which one is positioned behind?" }, { "from": "gpt", "value": "Point (0.727, 0.347)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b1087e105af779f.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the front row of the event hall and notice a person with matte black hair at left. If you look straight ahead, will the banners on the back wall block your view of their hair?" }, { "from": "gpt", "value": "The banners on the back wall are positioned behind the stage area, and the matte black hair at left is located at point (0.039, 0.537). Since the banners are on the back wall and the person with matte black hair is in the foreground, their hair would be in front of the banners. Therefore, the banners would not block your view of the matte black hair at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/897604265c1dc5b4.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte window sill at center have a greater height compared to metallic silver camera at right?" }, { "from": "gpt", "value": "Yes, white matte window sill at center is taller than metallic silver camera at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/279b9f0c1bd153f3.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.297, 0.658) or point (0.741, 0.811)?" }, { "from": "gpt", "value": "The point (0.741, 0.811) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fbeb1576f67bdf9c.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the riverside dock and see the blue smooth water at center and the wooden boat at center. Which one appears bigger in the image?" }, { "from": "gpt", "value": "The blue smooth water at center is larger in size than the wooden boat at center, so the blue smooth water at center appears bigger." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0701f96e3a937674.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the rusty metal pole at center without the matte fabric flag at upper center blocking it. Is this possible given their positions?" }, { "from": "gpt", "value": "The rusty metal pole at center is behind the matte fabric flag at upper center, so it is already blocked by the flag. Therefore, capturing the pole without the flag blocking it would not be possible with their current positions." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/131e445aebb8ee3d.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.531, 0.666) from camera?" }, { "from": "gpt", "value": "A distance of 11.75 feet exists between point (0.531, 0.666) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/748eb359b726d6e0.jpg", "conversations": [ { "from": "human", "value": "\nHow close is green leafy tree at center from camera?" }, { "from": "gpt", "value": "green leafy tree at center and camera are 271.85 feet apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e1a033184fffdc65.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white marble tower at upper left is positioned above green leafy tree at lower center?" }, { "from": "gpt", "value": "Indeed, white marble tower at upper left is positioned over green leafy tree at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4466ee63f21a9883.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of matte khaki shorts at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.847, 0.477)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf654fa92239a4de.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the left, dark suit jacket at center or dark hair at center?" }, { "from": "gpt", "value": "dark suit jacket at center is more to the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/14c9bab344306bb9.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked as point (0.567, 0.289) and want to take a photo of the waterfall. If your camera is 107.60 feet away from you, will you be able to capture the entire waterfall in the photo?" }, { "from": "gpt", "value": "Yes, since the camera is 107.60 feet away from point (0.567, 0.289), you can capture the entire waterfall in the photo as the distance allows the camera to encompass the whole scene." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23e3e503058c7238.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.474, 0.956) come in front of point (0.398, 0.547)?" }, { "from": "gpt", "value": "Yes, point (0.474, 0.956) is in front of point (0.398, 0.547)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e955bf4336a5560.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer planning to capture the cenote from a specific vantage point. You notice the clear glass water at center and the green leafy tree at center. Which object will appear closer to the camera in your photo?" }, { "from": "gpt", "value": "The clear glass water at center will appear closer to the camera because it is positioned in front of the green leafy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed25882f663e2d62.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte white shirt at center appear on the left side of pink satin dress at left?" }, { "from": "gpt", "value": "In fact, matte white shirt at center is to the right of pink satin dress at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b4bd4e010a6487b.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, concrete rubble at center or dark brown hair at lower center?" }, { "from": "gpt", "value": "Positioned to the left is dark brown hair at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d7ee96292b4718f0.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the waterfront facing the historic building. You notice two points marked on the scene. The first point is at coordinates point (0.390, 0.256) and the second is at point (0.252, 0.777). Which point is closer to you?" }, { "from": "gpt", "value": "Point (0.390, 0.256) is further to the camera than point (0.252, 0.777), so the point closer to you is point (0.252, 0.777)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d433aee053c4ba33.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.232, 0.463) come behind point (0.377, 0.984)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3814fd7431ec1c1a.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance measurement between matte black jacket at left and black fabric pavement at left?" }, { "from": "gpt", "value": "matte black jacket at left and black fabric pavement at left are 4.88 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf41e1a0217b9f8f.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a light gray sweater at center. Pinpoint a point to the light gray sweater at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.706, 0.736)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3cb3e8a1d5ad2801.jpg", "conversations": [ { "from": "human", "value": "\nWhere is dark brown suit at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.528, 0.778)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7cf4956febb5836d.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte brown leather jacket at upper center appear on the right side of matte black nose at upper center?" }, { "from": "gpt", "value": "Incorrect, matte brown leather jacket at upper center is not on the right side of matte black nose at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a292248bb2bffb3d.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of matte blue dress at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.699, 0.675)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e25b2834b5312b1a.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between wooden computer desk at center and camera." }, { "from": "gpt", "value": "wooden computer desk at center and camera are 1.40 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5120981ebef3e86f.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of smooth stone tower at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.499, 0.336)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/19b1720445b6bb8a.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the matte blue shirt at left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.254, 0.539)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/69da81928dd40c4b.jpg", "conversations": [ { "from": "human", "value": "\nDoes beige paper money at center have a larger size compared to gray paper currency at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/018f992754da53e8.jpg", "conversations": [ { "from": "human", "value": "\nIs dark wood door at center shorter than terracotta textured pot at lower right?" }, { "from": "gpt", "value": "No, dark wood door at center is not shorter than terracotta textured pot at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b3693fd244b7960a.jpg", "conversations": [ { "from": "human", "value": "\nIs dark gray shirt at center bigger than dark gray sweater at center?" }, { "from": "gpt", "value": "Indeed, dark gray shirt at center has a larger size compared to dark gray sweater at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fa387650fef1955b.jpg", "conversations": [ { "from": "human", "value": "\nIs transparent glass window at center to the right of black fabric curtain at center from the viewer's perspective?" }, { "from": "gpt", "value": "Yes, transparent glass window at center is to the right of black fabric curtain at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e36a1b439463cd99.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.836, 0.477) lie in front of point (0.325, 0.391)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.325, 0.391)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/309470ff4d4ead57.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at center taller than silver metallic truck at left?" }, { "from": "gpt", "value": "Indeed, green leafy tree at center has a greater height compared to silver metallic truck at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d96d87303b43c41f.jpg", "conversations": [ { "from": "human", "value": "\nIs brown stone stairs at center bigger than tan fabric shorts at center?" }, { "from": "gpt", "value": "Correct, brown stone stairs at center is larger in size than tan fabric shorts at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5acca1f4330d9707.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the DJ table in the foreground of the scene. You need to locate the pink matte shirt at center. According to the coordinates provided, where should you look relative to your position?" }, { "from": "gpt", "value": "The pink matte shirt at center is located at coordinates point (0.793, 0.534), which means it is positioned slightly to the right and lower from the center of the scene." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9a606fbaee70de22.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a black beaded hijab at upper right. Pinpoint a point to the black beaded hijab at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.876, 0.281)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/81c26591e115357c.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.726, 0.383) or point (0.265, 0.378)?" }, { "from": "gpt", "value": "Positioned behind is point (0.265, 0.378)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d798b4acbb0b5df9.jpg", "conversations": [ { "from": "human", "value": "\nBetween maroon jersey at lower center and light brown hair at lower left, which one has less height?" }, { "from": "gpt", "value": "With less height is maroon jersey at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6a4c5b752f0d8a42.jpg", "conversations": [ { "from": "human", "value": "\nDoes green fuzzy hat at upper center have a smaller size compared to matte black shirt at left?" }, { "from": "gpt", "value": "Actually, green fuzzy hat at upper center might be larger than matte black shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5e5ad3e98161f81.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between brown hair at lower center and black sweater at right." }, { "from": "gpt", "value": "brown hair at lower center and black sweater at right are 9.07 feet apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7428ededcd5748c8.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.923, 0.823) lie in front of point (0.578, 0.336)?" }, { "from": "gpt", "value": "Yes, point (0.923, 0.823) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5de22590c46f0ec6.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of clear glassy water at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.476, 0.662)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/197948a20c95bc37.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the white matte terrace at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.423, 0.459)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d2f3e7aab7558e2.jpg", "conversations": [ { "from": "human", "value": "\nLocate the white painted wood boat at center in the image." }, { "from": "gpt", "value": "[(0.375, 0.914)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/83c3ad95ea7b5a19.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of matte black jacket at left from camera?" }, { "from": "gpt", "value": "They are 3.95 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1dd2827ad5d2eed4.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer adjusting the focus on a camera. The subject is the white matte kandura at center, and you want to ensure the curly brown hair at center is also in focus. Given the current depth of field, can you estimate if both will be sharp?" }, { "from": "gpt", "value": "The distance between the white matte kandura at center and curly brown hair at center is 7.49 inches. Since they are only 7.49 inches apart, and the depth of field is shallow, it is likely that both will be in focus if they are within the same focal plane. However, the photographer should check the focus settings to ensure the entire distance is covered." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7188c181af400edd.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.007, 0.711) positioned in front of point (0.387, 0.662)?" }, { "from": "gpt", "value": "Yes, point (0.007, 0.711) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/816796a154d0ba2a.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between green moss-covered mound at left and camera." }, { "from": "gpt", "value": "A distance of 52.75 feet exists between green moss-covered mound at left and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/699256fbdbd4840a.jpg", "conversations": [ { "from": "human", "value": "\nBetween yellow matte building at center and white matte van at lower right, which one has more height?" }, { "from": "gpt", "value": "With more height is yellow matte building at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88474d9b06034da4.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, white feathered duck at center or orange glossy beak at upper right?" }, { "from": "gpt", "value": "white feathered duck at center is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4b03da75a135e46f.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.016, 0.680) positioned before point (0.837, 0.169)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.837, 0.169)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c5b8174440f32095.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue cotton candy at center is thinner than chocolate cake at left?" }, { "from": "gpt", "value": "No, blue cotton candy at center is not thinner than chocolate cake at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4da6bc3041d2b0a1.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery driver who needs to park your vehicle between the white matte suv at center and the shiny black car at lower left. Is there enough space between them to fit your car, which is 4.5 meters long?" }, { "from": "gpt", "value": "The white matte suv at center is positioned on the right side of the shiny black car at lower left. However, the exact distance between them isn not provided in the scene description. Therefore, it is impossible to determine if there is enough space to fit a 4.5 meter car between them." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1485104e5438f22b.jpg", "conversations": [ { "from": "human", "value": "\nPlease describe the position of the yellow matte cheese at center in relation to the other items on the table in the image." }, { "from": "gpt", "value": "The yellow matte cheese at center is located at the coordinates point (0.367, 0.927) on the table." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc68137453f79d4d.jpg", "conversations": [ { "from": "human", "value": "\nIs matte red shirt at center closer to the viewer compared to denim jeans at upper center?" }, { "from": "gpt", "value": "Yes, matte red shirt at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea55db8cac71c6ee.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of shiny orange leaves at center from matte gray shirt at center?" }, { "from": "gpt", "value": "shiny orange leaves at center and matte gray shirt at center are 32.76 feet apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9111ba2e7a3b20fd.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, green pine tree at upper center or green leafy tree at upper right?" }, { "from": "gpt", "value": "green pine tree at upper center is above." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16e303d98c4f1aa1.jpg", "conversations": [ { "from": "human", "value": "\nBetween green leafy shrub at center and dark green textured mountain at left, which one has less height?" }, { "from": "gpt", "value": "With less height is green leafy shrub at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e9e761e556bd408.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of matte black camera at left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.267, 0.561)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0266fe8cc06b1e1a.jpg", "conversations": [ { "from": "human", "value": "\nIs blue plaid shirt at left shorter than matte purple dress at right?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/66c6cc9f178b7d37.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if clear water at lower center is thinner than green textured tree at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc8c9c4ed1ad2c82.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.701, 0.562) from camera?" }, { "from": "gpt", "value": "Point (0.701, 0.562) and camera are 649.41 feet apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/635ebf24fb33c51b.jpg", "conversations": [ { "from": "human", "value": "\nDoes green mossy stone drinking fountain at center appear over green stone drinking fountain at lower center?" }, { "from": "gpt", "value": "Actually, green mossy stone drinking fountain at center is below green stone drinking fountain at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e7449aa44e9a2a28.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of a dead wood tree at center. How far are you from the tree?" }, { "from": "gpt", "value": "The dead wood tree at center is 8.09 meters from camera, so you are 8.09 meters away from the tree." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e1a50a2f6dd1722.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.774, 0.691) lie behind point (0.267, 0.055)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8cc8eb1816e5a109.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the meeting room and need to move from the first point to the second point. Which direction should you move to get from point (0.088, 0.780) to point (0.604, 0.834)?" }, { "from": "gpt", "value": "To move from point (0.088, 0.780) to point (0.604, 0.834), you should move upwards and to the right because point (0.088, 0.780) is in front of point (0.604, 0.834), indicating it is closer to the viewer. Moving away from the viewer towards the back would involve going upwards and to the right in the image." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/544262df0598e89c.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the concrete platform at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.389, 0.884)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/248739ae35d2b57a.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and want to hand a towel to the person wearing the matte white swimsuit at upper left. Considering the distance, can you reach them without moving from your current position?" }, { "from": "gpt", "value": "The matte white swimsuit at upper left is 110.15 meters away from the camera, so you cannot reach them without moving from your current position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b9d15c886a2a1f8.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.800, 0.717) lie behind point (0.315, 0.019)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01d048dbbb7a81b2.jpg", "conversations": [ { "from": "human", "value": "\nPoint to matte black suv at left.Point to the matte black suv at left in the image." }, { "from": "gpt", "value": "[(0.316, 0.669)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f23aac1a5363862.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the green grassy hillside at lower left and want to take a photo of the distant landscape. Your camera has a maximum focus range of 50 feet. Can you capture the landscape clearly with your current position?" }, { "from": "gpt", "value": "The distance between the green grassy hillside at lower left and the camera is 45.65 feet, which is within the camera maximum focus range of 50 feet. Therefore, you can capture the landscape clearly from your current position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a44ede241fccd254.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.319, 0.825) or (0.754, 0.369)?" }, { "from": "gpt", "value": "Point (0.754, 0.369) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a703e2bdc2bb6495.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, matte skin eye at center or light brown skin at center?" }, { "from": "gpt", "value": "With more height is matte skin eye at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/17d7e9d741e724d6.jpg", "conversations": [ { "from": "human", "value": "\nWhere is metal chain-link fence at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.512, 0.478)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60cc0fa31f1d3c31.jpg", "conversations": [ { "from": "human", "value": "\nIs orange matte container ship at center positioned behind teal painted metal pole at left?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0c5d817d1ae3f4a.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, smooth white shirt at center or metallic gray table at center?" }, { "from": "gpt", "value": "With more height is smooth white shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9a2caa3b5cf1917.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a checkered shirt at left. Pinpoint a point to the checkered shirt at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.102, 0.831)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca99dae5f741f5a9.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, blue fabric at right or smooth skin face at upper left?" }, { "from": "gpt", "value": "blue fabric at right is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/199b22cb3cb39506.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the green stained glass at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.112, 0.297)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d2ef74507071de2f.jpg", "conversations": [ { "from": "human", "value": "\nHow distant is matte gray shirt at center from orange rubber teething ring at center?" }, { "from": "gpt", "value": "matte gray shirt at center and orange rubber teething ring at center are 17.16 inches apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9377e28af1fcc417.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.277, 0.981) or point (0.395, 0.539)?" }, { "from": "gpt", "value": "The point (0.395, 0.539) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e83f26cff708aa21.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.168, 0.422) or (0.866, 0.492)?" }, { "from": "gpt", "value": "The point (0.866, 0.492) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b82248ee0e41c173.jpg", "conversations": [ { "from": "human", "value": "\nYou are a customer at a pizzeria and want to order the larger pizza between the red pepperoni pizza at center and the golden crispy pizza at center. Which one should you choose?" }, { "from": "gpt", "value": "The golden crispy pizza at center is larger than the red pepperoni pizza at center, so you should choose the golden crispy pizza at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf2ede4314362522.jpg", "conversations": [ { "from": "human", "value": "\nDoes silver metallic ladder at upper left have a smaller size compared to purple fabric at upper center?" }, { "from": "gpt", "value": "No, silver metallic ladder at upper left is not smaller than purple fabric at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d79409fe3ed1ab76.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of dark blue leather jacket at lower left from camera?" }, { "from": "gpt", "value": "dark blue leather jacket at lower left is 26.58 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4e793fe4a0cb6b6a.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the motorsport event and want to capture a photo of the neon yellow reflective vest at center and the matte red racing suit at center. Which object should you zoom in on to ensure both are clearly visible in the frame?" }, { "from": "gpt", "value": "The neon yellow reflective vest at center has a lesser width compared to matte red racing suit at center. To ensure both are clearly visible, you should zoom in on the matte red racing suit at center since it is wider and will take up more space in the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3bff759c11661474.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the black matte t-shirt at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.121, 0.566)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/68fe37e1f75a5eb7.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of matte blue t-shirt at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.244, 0.611)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bcd8ec895ed66098.jpg", "conversations": [ { "from": "human", "value": "\nHow far is purple matte flower at lower left from matte yellow flower at left?" }, { "from": "gpt", "value": "purple matte flower at lower left is 16.47 inches from matte yellow flower at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7a219a7720abe14e.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and want to take a photo of the point at coordinates point (0.609, 0.850). How far do you need to move forward or backward to be exactly 5 meters away from the point?" }, { "from": "gpt", "value": "The point (0.609, 0.850) is currently 4.56 meters away from the camera. To be exactly 5 meters away, you need to move backward by 0.44 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8e6140f2e56fc61.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of black satin suit at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.859, 0.577)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/22821157e76303ec.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, brown stone tower at center or green fabric shirt at center?" }, { "from": "gpt", "value": "brown stone tower at center is above." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8784728c2a7e1d8f.jpg", "conversations": [ { "from": "human", "value": "\nWhere is matte brown jacket at left located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.233, 0.556)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/840b45b67c3d0fa5.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.042, 0.459) or point (0.495, 0.016)?" }, { "from": "gpt", "value": "Positioned in front is point (0.042, 0.459)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4fe30850af05ae5c.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark blue shirt at center appear under light blue shirt at lower right?" }, { "from": "gpt", "value": "Yes, dark blue shirt at center is below light blue shirt at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0cae8fdcee6849b7.jpg", "conversations": [ { "from": "human", "value": "\nDoes light brown suit at center appear over smooth green shirt at center?" }, { "from": "gpt", "value": "Incorrect, light brown suit at center is not positioned above smooth green shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2162aa3dfea10949.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.656, 0.580)?" }, { "from": "gpt", "value": "teal denim dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/abb694ff5a78bda2.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the matte black cap at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.179, 0.655)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7711d8c9bdc8f452.jpg", "conversations": [ { "from": "human", "value": "\nHow close is point (0.411, 0.903) from camera?" }, { "from": "gpt", "value": "The distance of point (0.411, 0.903) from camera is 41.99 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b61e6403d239f20.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, black matte t-shirt at center or matte red t-shirt at center?" }, { "from": "gpt", "value": "matte red t-shirt at center is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8aa2a2d05c16c536.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black matte letter k at center is positioned to the right of metallic gray pole at center?" }, { "from": "gpt", "value": "Indeed, black matte letter k at center is positioned on the right side of metallic gray pole at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a72cec1d5485dfba.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of pink cotton shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.945, 0.713)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ffb446b53ca68786.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the winter forest scene and want to take a photo of the white frosty tree at center. If your camera has a focal length of 50mm, which is optimal for capturing objects at 10 meters, will you need to adjust the focal length to get the tree in focus?" }, { "from": "gpt", "value": "The white frosty tree at center is 9.53 meters from viewer, which is slightly closer than the optimal 10 meters for the 50mm focal length. You may need to adjust the focal length slightly shorter to ensure the tree is in focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e1a68e672a0217eb.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.750, 0.647) or point (0.505, 0.230)?" }, { "from": "gpt", "value": "Point (0.750, 0.647) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f9e5fcdd48295d3.jpg", "conversations": [ { "from": "human", "value": "\nWhere is shiny golden pineapple at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.175, 0.694)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d2e1ccf659f8bec5.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any dark gray fabric jacket at center in the image." }, { "from": "gpt", "value": "[(0.345, 0.664)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/471b54dfa919d860.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up for a group photo. You need to position yourself so that both the matte black leg at upper left and the black matte shirt at lower right are visible in your frame. Based on their positions, where should you stand relative to the scene?" }, { "from": "gpt", "value": "You should position yourself below the scene so that the matte black leg at upper left, which is above the black matte shirt at lower right, can be captured in the frame along with the black matte shirt at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e0a47a5d4daa991.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, greenish water at center or snowy rock mountain at upper left?" }, { "from": "gpt", "value": "snowy rock mountain at upper left is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7a8b33b9a6308c78.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.430, 0.677) or (0.082, 0.652)?" }, { "from": "gpt", "value": "Positioned behind is point (0.082, 0.652)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29854f926f2e429e.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.140, 0.572) positioned behind point (0.206, 0.348)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3da9d77c9634ece2.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.758, 0.631) or point (0.589, 0.467)?" }, { "from": "gpt", "value": "Positioned behind is point (0.589, 0.467)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c554c469a99fc50.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer planning to take a picture of the brown dry grass at center and the wooden signboard at upper center. Which object will appear taller in the photo?" }, { "from": "gpt", "value": "The brown dry grass at center appears taller in the photo because it has a greater height compared to the wooden signboard at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fd25ba871c986556.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the green grass at lower left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.311, 0.800)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8710027257f97163.jpg", "conversations": [ { "from": "human", "value": "\nYou are a drone operator who needs to fly your drone from the white metallic tower at center to the dark blue water at right. Based on the scene, which direction should you fly the drone to reach the water?" }, { "from": "gpt", "value": "The dark blue water at right is further to the viewer than the white metallic tower at center, so you should fly the drone towards the right side of the image to reach the water." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c41ed374f488b19c.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of black suit at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.218, 0.616)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7a6930206ecd7ae.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the satin silver sedan at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.896, 0.764)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/143d6ffd5f6c4e78.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green metallic sign at left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.161, 0.503)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5dac04bf19d6c8e8.jpg", "conversations": [ { "from": "human", "value": "\nDoes green needle-like tree at upper left appear under bare branches at upper right?" }, { "from": "gpt", "value": "Incorrect, green needle-like tree at upper left is not positioned below bare branches at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/733ba70737c8ee15.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the perfect shot of the green satin cape at center. Using a camera with a 50mm lens, which has a field of view of approximately 30 degrees, can you determine if the cape is within the camera frame centered at point 0.5,0.5 with a 30 degree field of view?" }, { "from": "gpt", "value": "The green satin cape at center is located at point (0.314, 0.472). Since the camera frame is centered at (0.500, 0.500) with a 30 degree field of view, the cape is within the frame as its coordinates are close to the center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c23db5d2e4a7c29.jpg", "conversations": [ { "from": "human", "value": "\nCould you measure the distance between matte gray dress at left and pink soft fabric baby at lower right?" }, { "from": "gpt", "value": "matte gray dress at left and pink soft fabric baby at lower right are 5.02 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/112b0e5b7de441ea.jpg", "conversations": [ { "from": "human", "value": "\nYou are a painter who needs to decide which object to paint first. The black wrought iron balcony at upper center and the metallic pole at left are both in need of a fresh coat. Based on their sizes, which one would require more paint?" }, { "from": "gpt", "value": "The black wrought iron balcony at upper center might be wider than metallic pole at left, so it would require more paint." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1b0d0e8260cb87e.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.787, 0.808) or (0.253, 0.203)?" }, { "from": "gpt", "value": "The point (0.253, 0.203) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1497087164dc7f50.jpg", "conversations": [ { "from": "human", "value": "\nIs black plastic recycling bin at left bigger than black plastic bin at left?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c9d069d50f51dfb6.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer taking a picture of the passengers on the roller coaster. You notice the dark brown hair at center and the blue fabric shirt at center. Which object should you focus on to capture the one that is taller?" }, { "from": "gpt", "value": "The dark brown hair at center is much taller than the blue fabric shirt at center, so you should focus on the dark brown hair at center to capture the taller object." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea73738bb6770471.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance measurement between green grassy at lower center and white matte cottage at center?" }, { "from": "gpt", "value": "green grassy at lower center and white matte cottage at center are 4.55 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/26bd8577dafa460a.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.007, 0.702) from camera?" }, { "from": "gpt", "value": "Point (0.007, 0.702) is 3.76 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7a9d875da7bf8ba0.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the camera position. You want to take a picture of the black matte dress at center. Is the dress within your camera frame?" }, { "from": "gpt", "value": "The black matte dress at center is 24.26 meters from the camera. Since most cameras can focus on objects up to 20 meters away, the dress might be slightly out of focus or require a zoom lens to capture clearly. Adjust your camera settings or move closer for a better shot." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6cefefb71e462fa6.jpg", "conversations": [ { "from": "human", "value": "\nLocate all matte plastic heart at center in the image." }, { "from": "gpt", "value": "[(0.512, 0.430)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b946a69c6cb4f503.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up a photo shoot. You see the smooth black mouse at lower center and the yellow rubber band at wrist in the scene. Which object is closer to the camera?" }, { "from": "gpt", "value": "The yellow rubber band at wrist is closer to the camera because the smooth black mouse at lower center is positioned under it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92ac3be23af19b7a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if shiny metallic bicycle at center is positioned above shiny red bicycle at center?" }, { "from": "gpt", "value": "Actually, shiny metallic bicycle at center is below shiny red bicycle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/59ac1de12cc62df2.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.516, 0.738)?" }, { "from": "gpt", "value": "dull brown mud at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/121fedf358e44ecd.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing a charity event and need to display two items from the image. The matte gray coat at center and the floral print scarf at center must be placed on a mannequin. Since space is limited, which item should you place first to ensure both fit properly?" }, { "from": "gpt", "value": "The matte gray coat at center is larger in size than the floral print scarf at center, so you should place the larger matte gray coat at center first to ensure both items fit on the mannequin." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c9061943cf4b12b.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy palm tree at center wider than silhouette leafy palm at center?" }, { "from": "gpt", "value": "Yes, green leafy palm tree at center is wider than silhouette leafy palm at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/18c75e1034ccd6f4.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the green matte sweatshirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.301, 0.495)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e4d6998cc2a8d77d.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, smooth sand beach at center or brown fur dog at center, stands shorter?" }, { "from": "gpt", "value": "brown fur dog at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7d8239155772749a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green textured evergreen tree at center is positioned to the right of snow-covered pine tree at center?" }, { "from": "gpt", "value": "In fact, green textured evergreen tree at center is to the left of snow-covered pine tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ab3dd4f4a1d17f6.jpg", "conversations": [ { "from": "human", "value": "\nBetween matte brown dome at upper left and smooth beige spire at right, which one is positioned higher?" }, { "from": "gpt", "value": "Positioned higher is matte brown dome at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0531add3e8c3d9ec.jpg", "conversations": [ { "from": "human", "value": "\nYou are a passenger in the back seat of a car and want to know which object in front of you is narrower between the light beige hoodie at center and the yellow plastic taxi at center. Which one is narrower?" }, { "from": "gpt", "value": "The light beige hoodie at center is thinner than the yellow plastic taxi at center, so the light beige hoodie at center is narrower." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c4da59c7407149f.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.239, 0.716) from camera?" }, { "from": "gpt", "value": "Point (0.239, 0.716) is 227.28 feet from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b96313e9c7353907.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.273, 0.617) lie behind point (0.255, 0.161)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf39595c48aa89ec.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the black fabric couch at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.778, 0.525)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bcdcd9ab5f8f3cfe.jpg", "conversations": [ { "from": "human", "value": "\nIs tan mesh shoes at center positioned in front of tan suede sandal at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/09cb95c776d4fc67.jpg", "conversations": [ { "from": "human", "value": "\nYou are a physical therapist standing 10 feet away from the black plastic wheelchair at center. You need to retrieve a therapy tool from a shelf behind you. Can you reach the shelf without moving closer to the wheelchair?" }, { "from": "gpt", "value": "The black plastic wheelchair at center is 7.56 feet away from the viewer. Since you are standing 10 feet away, you are farther than the wheelchair. Therefore, the shelf behind you is accessible without moving closer to the wheelchair." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77c3568661f6526b.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, dull brown dirt at center or green leafy trees at right?" }, { "from": "gpt", "value": "green leafy trees at right is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ddb0ba4e8a48ec36.jpg", "conversations": [ { "from": "human", "value": "\nYou are observing two flies on a wooden surface. The scene includes a shiny black fly at center and a black glossy fly at center. Which fly is located to the left of the other?" }, { "from": "gpt", "value": "The shiny black fly at center is positioned on the left side of the black glossy fly at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6542f9149159cfe7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green textured pine tree at upper right is taller than green textured tree at upper left?" }, { "from": "gpt", "value": "Indeed, green textured pine tree at upper right has a greater height compared to green textured tree at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5fd5910243bfe909.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.426, 0.948) come behind point (0.143, 0.773)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7726749947b23b0b.jpg", "conversations": [ { "from": "human", "value": "\nBetween purple fabric at left and teal fabric headscarf at upper left, which one is positioned lower?" }, { "from": "gpt", "value": "purple fabric at left is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fac4b581319c1df9.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, white smooth house at center or green wooden cottage at upper right?" }, { "from": "gpt", "value": "green wooden cottage at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dbb2714451ef1abf.jpg", "conversations": [ { "from": "human", "value": "\nPoint to dark gray fabric pants at center.Point to the dark gray fabric pants at center in the image." }, { "from": "gpt", "value": "[(0.450, 0.544)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/41c9b29194043c45.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.670, 0.317) more distant than point (0.652, 0.812)?" }, { "from": "gpt", "value": "Yes, point (0.670, 0.317) is behind point (0.652, 0.812)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dda32fb700539a10.jpg", "conversations": [ { "from": "human", "value": "\nDoes brick building at center have a smaller size compared to black wrought iron gate at center?" }, { "from": "gpt", "value": "No, brick building at center is not smaller than black wrought iron gate at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3e9a3d0573a6dcce.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, matte gray sweater at center or gray hoodie at upper right, stands shorter?" }, { "from": "gpt", "value": "gray hoodie at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06a224b6c50bed29.jpg", "conversations": [ { "from": "human", "value": "\nIs rusty stone wall at center positioned in front of green leafy tree at upper center?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4ac947019ecb225f.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the satin blue suit at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.945, 0.491)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/710a1df28dae3a08.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer adjusting the focus on your camera. You need to ensure that both the pink satin blouse at center and the silver metallic necklace at center are in sharp focus. Given that your camera has a depth of field that can cover 12 inches, will both items be in focus?" }, { "from": "gpt", "value": "The distance between the pink satin blouse at center and the silver metallic necklace at center is 11.67 inches, which is within the camera depth of field of 12 inches. Therefore, both items will be in focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e6e8c5a857721f65.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green leafy tree at left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.185, 0.266)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1edbcce352ce8e89.jpg", "conversations": [ { "from": "human", "value": "\nWhere is the gray matte shirt at center located in the image?" }, { "from": "gpt", "value": "The gray matte shirt at center is located at point coordinates of 0.684 on the x axis and 0.619 on the y axis." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29c38c92d585e8bc.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up a shoot in this living room. You want to position a small lamp between the matte gray couch at center and the yellow matte shirt at center. Based on their positions, where should the lamp be placed relative to the couch?" }, { "from": "gpt", "value": "The lamp should be placed above the matte gray couch at center since the yellow matte shirt at center is above it, and the lamp needs to be between them." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7f4e143ab3135569.jpg", "conversations": [ { "from": "human", "value": "\nIs fluffy yellow wig at center to the left of rubber-like brown hand at center from the viewer's perspective?" }, { "from": "gpt", "value": "Correct, you'll find fluffy yellow wig at center to the left of rubber-like brown hand at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/32c9e83c9c6e5e7a.jpg", "conversations": [ { "from": "human", "value": "\nYou are a botanist studying ferns in this forest. You observe two ferns labeled as green leafy fern at center and green leafy fern at lower center. Which fern is shorter?" }, { "from": "gpt", "value": "The green leafy fern at center is shorter than the green leafy fern at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e340aa9541944e0d.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the blue denim jacket at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.810, 0.667)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00bcb48aed8e6b36.jpg", "conversations": [ { "from": "human", "value": "\nIs clear water at center smaller than clear glass water at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e05cdf294d7a59ed.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.856, 0.811) or (0.348, 0.745)?" }, { "from": "gpt", "value": "Point (0.856, 0.811)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/64ea628f02c13dec.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, blue corrugated metal buildings at center or rocky gray mountain at center?" }, { "from": "gpt", "value": "blue corrugated metal buildings at center is more to the right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/96e3d21b5db4fea0.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, green rubber surfboard at center or smooth yellow surfboard at center?" }, { "from": "gpt", "value": "From the viewer's perspective, smooth yellow surfboard at center appears more on the right side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f06f7ae1cb9d4da4.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.600, 0.772) and point (0.457, 0.748), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.457, 0.748) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/af6b4b31659fbbe9.jpg", "conversations": [ { "from": "human", "value": "\nHow far is point (0.632, 0.542) from the camera?" }, { "from": "gpt", "value": "Point (0.632, 0.542) and camera are 3.80 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/113fd4d785f2480e.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, matte blue parking sign at center or white matte sign at center?" }, { "from": "gpt", "value": "matte blue parking sign at center is higher up." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b48fa30092af075.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from point (0.324, 0.930) to camera." }, { "from": "gpt", "value": "Point (0.324, 0.930) is 4.97 feet from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ca46eb489e92f91.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, brown matte sweater at center or purple textured jacket at left?" }, { "from": "gpt", "value": "brown matte sweater at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/69da1c75aabd105c.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the green fabric cape at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.247, 0.792)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08c8f95a7d5173e2.jpg", "conversations": [ { "from": "human", "value": "\nDoes green chain-link fence at upper center have a greater height compared to spotted fur dog at center?" }, { "from": "gpt", "value": "In fact, green chain-link fence at upper center may be shorter than spotted fur dog at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2296e557be4008a3.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of matte black shirt at right? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.929, 0.516)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3f2a50a65e20b7bf.jpg", "conversations": [ { "from": "human", "value": "\nYou are a mountain rescue team member assessing the cable car system. The metallic yellow cable car at center and the blue metallic cable car at upper center are both suspended on the same cable. Which cable car has a greater chance of causing instability in the cable system due to its width?" }, { "from": "gpt", "value": "The metallic yellow cable car at center might be wider than blue metallic cable car at upper center, so it has a greater chance of causing instability in the cable system due to its width." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9004fa28aa9b1785.jpg", "conversations": [ { "from": "human", "value": "\nWhat are the coordinates of the spotted fur dog at center?" }, { "from": "gpt", "value": "The coordinates of the spotted fur dog at center are at point (0.486, 0.487)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9cf6ef1f75a9535.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.998, 0.708) and point (0.840, 0.050), which one is positioned in front?" }, { "from": "gpt", "value": "Positioned in front is point (0.998, 0.708)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/163d29c2ac72aaf4.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte red cabin at lower left appear under green wooden cabin at center?" }, { "from": "gpt", "value": "Correct, matte red cabin at lower left is located below green wooden cabin at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d4429c521885545.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a striped cotton shirt at center. Pinpoint a point to the striped cotton shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.218, 0.555)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1ed8d0e9d08dbc5.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is gray fleece hoodie at center from camera?" }, { "from": "gpt", "value": "A distance of 12.63 meters exists between gray fleece hoodie at center and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0267eecd98cfc17b.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the center of the room and want to reach the point marked as point (0.446, 0.525). How far do you need to walk?" }, { "from": "gpt", "value": "The point (0.446, 0.525) is 6.84 feet away from the viewer, so you need to walk 6.84 feet to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/424c17d73223ed6c.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the brown dirt field at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.517, 0.823)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c0e2de6e0ffcbb67.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of white cotton shirt at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.589, 0.508)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/580e1ca3064a9362.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at center lie behind teal matte suv at lower right?" }, { "from": "gpt", "value": "Yes, green leafy tree at center is further from the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/578b11d208977066.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of wooden table at center less distant than that of white cotton shirt at left?" }, { "from": "gpt", "value": "Yes, it is in front of white cotton shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/514b4fa7dbf59258.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to knitted scarf at center? Please provide its 2D coordinates.Where can I find knitted scarf at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.776, 0.797)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/51654ea261f4bdd7.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.395, 0.323) or point (0.109, 0.645)?" }, { "from": "gpt", "value": "The point (0.395, 0.323) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29757c563830463b.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.548, 0.373) or point (0.883, 0.798)?" }, { "from": "gpt", "value": "The point (0.548, 0.373) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d871c3ea2a4ef289.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte shirt at center bigger than white paper at center?" }, { "from": "gpt", "value": "Indeed, white matte shirt at center has a larger size compared to white paper at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f166cf9699fafbfb.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the green leafy plant at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.363, 0.403)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05ae023e1dd946ed.jpg", "conversations": [ { "from": "human", "value": "\nIs maroon silk robe at lower left closer to camera compared to matte gold robe at center?" }, { "from": "gpt", "value": "Yes, maroon silk robe at lower left is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9de962a35767b836.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.629, 0.641) come farther from viewer compared to point (0.630, 0.634)?" }, { "from": "gpt", "value": "Yes, it is behind point (0.630, 0.634)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/64e63414195d434a.jpg", "conversations": [ { "from": "human", "value": "\nDoes black leather chair at lower center have a larger size compared to matte black chair at lower right?" }, { "from": "gpt", "value": "Correct, black leather chair at lower center is larger in size than matte black chair at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db6eba7140d6eb0b.jpg", "conversations": [ { "from": "human", "value": "\nIs ivory satin dress at center bigger than white lace dress at left?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5dea78fee678f2df.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.014, 0.744) or (0.530, 0.997)?" }, { "from": "gpt", "value": "Point (0.014, 0.744)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ffbcacdc8c0f014.jpg", "conversations": [ { "from": "human", "value": "\nYou are an artist trying to sketch this scene. You want to ensure the cloudy sky at upper center and the silhouette wood barn at center are positioned correctly in terms of depth. Which object should you draw first to establish the background?" }, { "from": "gpt", "value": "The cloudy sky at upper center should be drawn first as it is further away from the viewer compared to the silhouette wood barn at center, making it part of the background." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/509bf90e447e1b26.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the beach and see the white plastic boat at center. If you want to walk to the boat, how far do you have to walk?" }, { "from": "gpt", "value": "The white plastic boat at center is 339.54 feet away from you, so you have to walk 339.54 feet to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78dc26e6377e8126.jpg", "conversations": [ { "from": "human", "value": "\nLocate wooden cabinet at upper center in the image." }, { "from": "gpt", "value": "[(0.161, 0.839)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c88d18b0a61b7344.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the classroom and want to reach the point at coordinates point (0.199, 0.891). How far do you need to walk to get there?" }, { "from": "gpt", "value": "The distance between you and the point (0.199, 0.891) is 7.29 feet, so you need to walk 7.29 feet to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3406d26fd2d04b86.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the position of the viewer. There is a point marked at coordinates point (0.442, 0.755) in the scene. How far away is that point from you?" }, { "from": "gpt", "value": "The point (0.442, 0.755) is 4.87 feet away from the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4d45f9e03c20b037.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between rugged stone mountain at upper center and metallic silver car at lower center." }, { "from": "gpt", "value": "188.55 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d805ca2084784454.jpg", "conversations": [ { "from": "human", "value": "\nYou are a soccer coach analyzing the players on the field. You notice the green jersey at center and the matte green shorts at center. Which item is wider in the image?" }, { "from": "gpt", "value": "The green jersey at center might be wider than matte green shorts at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ba67d647d2def3d.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte white sign at upper left have a lesser width compared to black plastic sunglasses at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b3c4087c5e91b492.jpg", "conversations": [ { "from": "human", "value": "\nIs white fluffy cloud at upper left positioned in front of green matte tree at upper center?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ade19dff283815a6.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the brown sandy beach at lower left and want to reach the shiny metallic water at left. How far do you need to walk to get there?" }, { "from": "gpt", "value": "The distance between the brown sandy beach at lower left and the shiny metallic water at left is 24.08 meters, so you need to walk 24.08 meters to reach the water." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d71c4a7d54673b8e.jpg", "conversations": [ { "from": "human", "value": "\nWhere is white cotton shirt at upper right located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.849, 0.102)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73027590aa1548f8.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue striped long-sleeve shirt at center is shorter than black matte hoodie at right?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/048ae7418552e2a5.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person who needs to load a package that requires a minimum of 6 feet of space between the shiny red school bus at center and the white plastic license plate at lower center. Is there enough space?" }, { "from": "gpt", "value": "The distance between the shiny red school bus at center and the white plastic license plate at lower center is 5.77 feet, which is less than the required 6 feet. Therefore, there is not enough space to load the package." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b902c6313b34e93.jpg", "conversations": [ { "from": "human", "value": "\nYou are a guest in this hotel room and want to place a 12 inch wide decorative pillow between the pink fabric at center and the pink fabric doll at left. Is there enough space to fit the pillow between them?" }, { "from": "gpt", "value": "The pink fabric at center and the pink fabric doll at left are 30.03 inches apart from each other. Since the pillow is 12 inches wide, there is enough space to place it between them as 30.03 inches is greater than 12 inches." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fdb4ee1add4e7843.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and want to reach the point marked as point (0.377, 0.816). How far do you need to walk to get there?" }, { "from": "gpt", "value": "You need to walk 1.14 meters to reach point (0.377, 0.816) from your current position at the camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b987cee2822f13e2.jpg", "conversations": [ { "from": "human", "value": "\nYou are an artist examining the sculpture and the surrounding area. You want to know which object has a greater thickness between the rusty clay face at center and the green grass at lower center. Which one is thicker?" }, { "from": "gpt", "value": "The green grass at lower center is thicker than the rusty clay face at center, as the description states that the rusty clay face at center is thinner than the green grass at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d22cac5d96ca79c.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from point (0.660, 0.948) to camera." }, { "from": "gpt", "value": "They are 38.23 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b502a35278b33ba.jpg", "conversations": [ { "from": "human", "value": "\nIs navy blue sweater at center positioned behind matte gray sweater at left?" }, { "from": "gpt", "value": "No, navy blue sweater at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/26929d563a28add6.jpg", "conversations": [ { "from": "human", "value": "\nBetween gray ice at center and snow-covered trees at center, which one is positioned higher?" }, { "from": "gpt", "value": "snow-covered trees at center is higher up." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e16cad53b11af543.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.875, 0.583)?" }, { "from": "gpt", "value": "beige fabric vest at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cae5001413277c60.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of stone building at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.327, 0.450)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/48aaa5d856736c38.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the orange fabric racing seat at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.610, 0.755)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d698b6bb4196e6b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown wood flooring at center is shorter than matte black t-shirt at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c6fe6c57eb1d3563.jpg", "conversations": [ { "from": "human", "value": "\nWhere is sandy at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.405, 0.828)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ccb62a6e9f6b1e02.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of rocky gray mountain at center in the image." }, { "from": "gpt", "value": "[(0.790, 0.250)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23099dca5e4aeccd.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of pink glossy tongue at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.516, 0.564)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ccb9c8042d53e3f1.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the white matte t-shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.367, 0.658)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/25edf2adef4991fb.jpg", "conversations": [ { "from": "human", "value": "\nYou are an architect planning to install a new decorative element between the white marble column at left and the white marble column at center. The element requires a minimum of 8 meters of space. Can the space between them accommodate this requirement?" }, { "from": "gpt", "value": "The white marble column at left is 8.27 meters away from the white marble column at center, which exceeds the minimum requirement of 8 meters. Therefore, the space between them can accommodate the new decorative element." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00dddbb0de019faf.jpg", "conversations": [ { "from": "human", "value": "\nLocate all matte blue dress at upper left in the image." }, { "from": "gpt", "value": "[(0.165, 0.072)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dbe102cdc700ef69.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the white matte door at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.899, 0.498)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd4cfb15f9631094.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of smooth black sweater at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.554, 0.670)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce651d6e7cd207bf.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, greenish water at center or white canvas boat at center?" }, { "from": "gpt", "value": "white canvas boat at center is higher up." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/255312a3aa9bfcc4.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.238, 0.536) or point (0.277, 0.914)?" }, { "from": "gpt", "value": "Point (0.277, 0.914)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/69b3c8b528c76da9.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the matte brown cardigan at upper left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.163, 0.648)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b92216afb6b19f0.jpg", "conversations": [ { "from": "human", "value": "\nIs dark gray suit at center below suede jacket at center?" }, { "from": "gpt", "value": "Correct, dark gray suit at center is located below suede jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe1afdbc702022f4.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.472, 0.128) positioned after point (0.239, 0.842)?" }, { "from": "gpt", "value": "No, (0.472, 0.128) is in front of (0.239, 0.842)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4cdc2514080e4871.jpg", "conversations": [ { "from": "human", "value": "\nHow close is black knitted beanie at upper center from teal plastic glasses at center?" }, { "from": "gpt", "value": "black knitted beanie at upper center is 12.39 inches away from teal plastic glasses at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7045b61c49094f2e.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer planning to take a portrait of the person sitting on the gray rough bark tree trunk at center. You notice the black soft jacket at center is partially covering the view. Can you adjust your position so that the jacket is no longer blocking the tree trunk?" }, { "from": "gpt", "value": "The black soft jacket at center is above the gray rough bark tree trunk at center, so moving your camera position slightly downward might allow you to capture the tree trunk without the jacket obstructing the view." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/80cb88d7f89ea988.jpg", "conversations": [ { "from": "human", "value": "\nBased on the scene description, where is the dark brown hair at center located in terms of coordinates?" }, { "from": "gpt", "value": "The dark brown hair at center is located at coordinates point (0.274, 0.700)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b38f6d76fdb9d9d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if wooden at lower center is positioned above white matte plastic bag at upper center?" }, { "from": "gpt", "value": "No, wooden at lower center is not above white matte plastic bag at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e848e43e4b8b2912.jpg", "conversations": [ { "from": "human", "value": "\nYou are trying to decide whether to place the hardcover book at lower left onto the wooden bookcase at upper center. Based on their sizes, will the book fit vertically on the bookcase?" }, { "from": "gpt", "value": "The wooden bookcase at upper center has a greater height compared to the hardcover book at lower left, so the book will fit vertically on the bookcase." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0760336e2c0e8a7.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the clear blue water at lower left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.306, 0.923)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4af81564a7bcf2e4.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the subway platform and want to reach a specific point marked at coordinates point (0.100, 0.009). How far is this point from you?" }, { "from": "gpt", "value": "The point (0.100, 0.009) is 4.87 meters away from you." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2cb3a212ea379e08.jpg", "conversations": [ { "from": "human", "value": "\nHow much distance is there between shiny bronze bust at center and shiny silver beard at center?" }, { "from": "gpt", "value": "shiny bronze bust at center and shiny silver beard at center are 3.87 inches apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a56d2bf3692d7c33.jpg", "conversations": [ { "from": "human", "value": "\nDoes clear water at center appear over green leafy tree at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fda0f24bdc215c55.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance measurement between green leafy tree at center and green leafy tree at upper right?" }, { "from": "gpt", "value": "The distance of green leafy tree at center from green leafy tree at upper right is 5.47 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0abd0a49cff716b.jpg", "conversations": [ { "from": "human", "value": "\nPoint to blue striped shirt at right.Point to the blue striped shirt at right in the image." }, { "from": "gpt", "value": "[(0.762, 0.609)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b9f256267354d8b.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at left below green leafy tree at right?" }, { "from": "gpt", "value": "Yes, green leafy tree at left is below green leafy tree at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/17084154df30c112.jpg", "conversations": [ { "from": "human", "value": "\nYou are an artist trying to sketch this scene. You need to place the dark brown textured hair at center accurately. What are the coordinates where you should position it?" }, { "from": "gpt", "value": "The dark brown textured hair at center should be placed at coordinates point (0.446, 0.348)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/32770fb0b4375f04.jpg", "conversations": [ { "from": "human", "value": "\nBetween black leather shoes at center and black leather shoe at center, which one has less height?" }, { "from": "gpt", "value": "With less height is black leather shoe at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6c988f68807c5d0.jpg", "conversations": [ { "from": "human", "value": "\nYou are an ornithologist observing the sky with your telescope. You notice two birds in the image, the dark feathered bird at bottom left and the dark feathered bird at upper right. Based on their positions in the sky, which bird appears closer to you?" }, { "from": "gpt", "value": "The dark feathered bird at bottom left appears closer because it is shorter than the dark feathered bird at upper right, which suggests it is farther away." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0b3149688ab0eff.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue fabric jacket at center is positioned to the left of dark blue fabric couple at center?" }, { "from": "gpt", "value": "No, blue fabric jacket at center is not to the left of dark blue fabric couple at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d3970b54cdb98c39.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of point (0.530, 0.303)?" }, { "from": "gpt", "value": "Point (0.530, 0.303) is 9.39 feet from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ac34ba3769775188.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black car at lower left closer to the viewer compared to black wire at upper left?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/da5c59c57b888126.jpg", "conversations": [ { "from": "human", "value": "\nYou are a medical professional examining the hand injury. You notice two points marked on the image. The first point is at coordinates point (0.602, 0.352) and the second is at point (0.092, 0.966). Which point is closer to the viewer?" }, { "from": "gpt", "value": "Point (0.092, 0.966) is closer to the viewer because point (0.602, 0.352) is behind it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b1dbc8b7f780629.jpg", "conversations": [ { "from": "human", "value": "\nYou are an airport staff member checking the positions of passengers. You see the white matte jacket at left and the matte black backpack at center. Which passenger is closer to the floor?" }, { "from": "gpt", "value": "The white matte jacket at left is closer to the floor because it is below the matte black backpack at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/66057a170f03fe81.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the white satin shirt at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.247, 0.792)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/725e32f4d5c11f29.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.162, 0.786) or (0.462, 0.798)?" }, { "from": "gpt", "value": "Point (0.162, 0.786) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff5892a84458a00f.jpg", "conversations": [ { "from": "human", "value": "\nWhere is blue jeans at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.455, 0.305)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bff8a67a43f38ae1.jpg", "conversations": [ { "from": "human", "value": "\nYou are an artist planning to paint the autumn scene. You have a brush that can cover an area of 10 cm. You need to paint both the autumn leaves at left and the brown grass at center. Which object requires a larger brush to cover its width?" }, { "from": "gpt", "value": "The autumn leaves at left might be wider than brown grass at center, so you should use a larger brush for the autumn leaves at left to ensure proper coverage." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca50bad21c202d24.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of white wooden table at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.510, 0.584)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab065247197eda1e.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the smooth plastic house at right? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.921, 0.291)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce400968d957f141.jpg", "conversations": [ { "from": "human", "value": "\nYou are planning to place the leathery brown leaf at lower left and the matte orange pumpkin at center on a shelf. If the shelf can only hold items up to the width of the pumpkin, will the leaf fit on the same shelf?" }, { "from": "gpt", "value": "The leathery brown leaf at lower left has a width less than the matte orange pumpkin at center, so it will fit on the shelf since its width is smaller than the pumpkin." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/87241d477cf0d346.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a closeup shot of both the black matte swimsuit at center and the black matte bikini at center. The camera you are using has a minimum focusing distance of 5 feet. Can you focus on both subjects simultaneously?" }, { "from": "gpt", "value": "The distance between the black matte swimsuit at center and the black matte bikini at center is 4.68 feet, which is less than the camera minimum focusing distance of 5 feet. Therefore, the camera can focus on both subjects simultaneously." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/966b4b24e0a3c993.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from pearl white chandelier at upper right to camera." }, { "from": "gpt", "value": "A distance of 2.88 meters exists between pearl white chandelier at upper right and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82f194f02d5b235d.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person who needs to park your vehicle in a tight parking spot that can only accommodate a vehicle that takes up less space. You have a shiny silver car at center and a rusty metal truck at right. Which vehicle should you choose to park in the spot?" }, { "from": "gpt", "value": "You should choose the shiny silver car at center because it occupies less space than the rusty metal truck at right, making it suitable for the tight parking spot." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7f5c8fe42279bc0.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.298, 0.827) less distant than point (0.535, 0.650)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2718c7d5158cd151.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between white matte boat at center and camera?" }, { "from": "gpt", "value": "white matte boat at center is 37.82 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b6ce3bc877a4289b.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between white metallic trailer truck at right and camera." }, { "from": "gpt", "value": "white metallic trailer truck at right is 4.90 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/09826a74de22ee15.jpg", "conversations": [ { "from": "human", "value": "\nDoes brick paved path at center appear on the right side of green leafy palm tree at right?" }, { "from": "gpt", "value": "Incorrect, brick paved path at center is not on the right side of green leafy palm tree at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8fbc2a855af7eac6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if silky white gown at center is shorter than white cotton blouse at center?" }, { "from": "gpt", "value": "Incorrect, silky white gown at center's height does not fall short of white cotton blouse at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29c54f0aa6591924.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy palm tree at lower left have a greater height compared to green leafy palm tree at center-right?" }, { "from": "gpt", "value": "In fact, green leafy palm tree at lower left may be shorter than green leafy palm tree at center-right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/53ca078faf49a036.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, matte brown notepad at left or matte black pen at left, stands taller?" }, { "from": "gpt", "value": "matte brown notepad at left is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/99a82fb077637ee6.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between blue smooth water at lower center and camera." }, { "from": "gpt", "value": "blue smooth water at lower center and camera are 14.57 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1efac05f1b2b8c28.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the center of the playground and want to go to the green rubber slide at left. Which direction should you move in to reach it?" }, { "from": "gpt", "value": "The green rubber slide at left is located at point 0.461 on the x and 0.244 on the y, so you should move towards the left and slightly forward to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e466cb4dd10c802e.jpg", "conversations": [ { "from": "human", "value": "\nIs translucent glass flower at center smaller than matte black sweater at lower right?" }, { "from": "gpt", "value": "Actually, translucent glass flower at center might be larger than matte black sweater at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6dabf72b0f78d71e.jpg", "conversations": [ { "from": "human", "value": "\nYou are an architect designing a new building and want to ensure that the sunlight reaches the garden below the window. Based on the image, where is the position of the bare branches at center relative to the window panes?" }, { "from": "gpt", "value": "The bare branches at center are positioned at coordinates point (0.811, 0.300), which means they are located near the lower part of the window, potentially blocking some sunlight from reaching the garden below. To allow more sunlight, consider adjusting the branch placement or window design." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7d0671b51942903.jpg", "conversations": [ { "from": "human", "value": "\nBetween copper wire mesh cage at center and light brown wooden stool at right, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "copper wire mesh cage at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/090ae48c767f7b0e.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.598, 0.266) in front of point (0.004, 0.256)?" }, { "from": "gpt", "value": "Yes, point (0.598, 0.266) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/83b7336b0d0fc85c.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any green grass at lower center in the image." }, { "from": "gpt", "value": "[(0.516, 0.930)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95e512622425694c.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the edge of the blue water at lower center and want to look at the gold textured lantern at upper right. Can you see it clearly without moving your head?" }, { "from": "gpt", "value": "The gold textured lantern at upper right is behind blue water at lower center, so you cannot see it clearly without moving your head." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a4dfd46f61c0fa9.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.389, 0.497) farther from camera compared to point (0.094, 0.398)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7ecd9a774c05dff.jpg", "conversations": [ { "from": "human", "value": "\nHow distant is matte black cigarette at upper left from brown textured tobacco at upper center?" }, { "from": "gpt", "value": "matte black cigarette at upper left is 4.56 feet from brown textured tobacco at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5032e500985a4edd.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to shiny blue vest at center? Please provide its 2D coordinates.Where can I find shiny blue vest at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.758, 0.408)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/349ced7c160fa746.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.864, 0.477) come farther from viewer compared to point (0.381, 0.675)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb7cee43ccb25e6d.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.622, 0.716) or point (0.592, 0.653)?" }, { "from": "gpt", "value": "Point (0.592, 0.653) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/76765de3add32d35.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.288, 0.380)?" }, { "from": "gpt", "value": "dark blue fabric at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed81b8127ac2981b.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.014, 0.405) closer to camera compared to point (0.600, 0.645)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.600, 0.645)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/74c1f05f07eea827.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of polished chrome mirror at center more distant than that of polished chrome ladder at center?" }, { "from": "gpt", "value": "Yes, polished chrome mirror at center is behind polished chrome ladder at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a726c638f230abc1.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of coarse textured palm tree at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.777, 0.195)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c27e19622c840e7c.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.017, 0.680) more distant than point (0.399, 0.256)?" }, { "from": "gpt", "value": "No, it is in front of (0.399, 0.256)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92a999d22a690c04.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte polo shirt at left have a lesser width compared to blue cotton polo shirt at center?" }, { "from": "gpt", "value": "Indeed, white matte polo shirt at left has a lesser width compared to blue cotton polo shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8bb5d5d680b86b96.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, yellow matte shirt at center or yellow matte shirt at lower right?" }, { "from": "gpt", "value": "yellow matte shirt at lower right is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1dd5aff2c497f42.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.219, 0.647) closer to camera compared to point (0.616, 0.502)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b6859d740ee12839.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.046, 0.800) or (0.261, 0.109)?" }, { "from": "gpt", "value": "Point (0.046, 0.800) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92f32755c339dbfe.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the greenish water at lower left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.576, 0.866)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3e509baf1a3a6e9f.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing a yard sale and want to place a new item between the blue denim dress at center and the cardboard box at lower center. Can you fit it there if the item is 0.5 meters wide?" }, { "from": "gpt", "value": "The blue denim dress at center is narrower than the cardboard box at lower center. Since the dress is narrower, the space between them might accommodate the 0.5 meter wide item, but exact placement depends on their exact positions. However, based on the width comparison alone, it could potentially fit." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c46f6c6d7a8ddb80.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.607, 0.559)?" }, { "from": "gpt", "value": "blue fabric couch at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/69f7b8bf4a6bb0c7.jpg", "conversations": [ { "from": "human", "value": "\nDoes white smoke at center appear under green textured tree at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4e2eb5f09db4a30f.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of white metal radiator at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.385, 0.381)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/133120515221ec81.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked as point (0.623, 0.258) and want to walk back to your starting position. How far do you need to walk?" }, { "from": "gpt", "value": "You need to walk 31.38 meters to return to your starting position since the distance between point (0.623, 0.258) and the viewer is 31.38 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/901645c1bb632d0c.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of cloudy sky at upper center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.494, 0.180)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b92476faa4063853.jpg", "conversations": [ { "from": "human", "value": "\nYou are an art student analyzing a portrait. You notice the brown woolen sweater at center and the black ink signature at lower right. Based on their positions in the image, which object is closer to the top of the portrait?" }, { "from": "gpt", "value": "The brown woolen sweater at center is located above the black ink signature at lower right, so it is closer to the top of the portrait." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/63b4ab49dd9db401.jpg", "conversations": [ { "from": "human", "value": "\nYou are planning to set up a picnic blanket in the backyard scene. Given the presence of the green grass at center and the metallic red ladder at center, which object would allow more space for the blanket?" }, { "from": "gpt", "value": "The green grass at center has a larger size compared to the metallic red ladder at center, so it would provide more space for the picnic blanket." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bfc00800d17cc2f1.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the matte brown paper bag at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.891, 0.583)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a2e09e05655fc70.jpg", "conversations": [ { "from": "human", "value": "\nBetween gray matte concrete at center and reflective yellow vest at center, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "From the viewer's perspective, reflective yellow vest at center appears more on the left side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c85ba48b2ac64cff.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.269, 0.928) farther from camera compared to point (0.208, 0.261)?" }, { "from": "gpt", "value": "No, it is in front of (0.208, 0.261)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5115add22f917479.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.524, 0.487) and point (0.678, 0.577), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.678, 0.577) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07607c1b34b524c2.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between brown wood bench at center and white matte hoodie at center?" }, { "from": "gpt", "value": "brown wood bench at center is 22.59 inches away from white matte hoodie at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/38c09d6b97a2d047.jpg", "conversations": [ { "from": "human", "value": "\nYou are a drone operator tasked with delivering a package to the brown tile roof at center. Your drone must fly over the brick chimney at left to reach it. Is this path possible given their positions?" }, { "from": "gpt", "value": "The brown tile roof at center is located below the brick chimney at left, so the drone can fly over the brick chimney at left to reach the brown tile roof at center as it is positioned lower." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f4ce4713170fe3a.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the camouflage fabric uniform at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.208, 0.375)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e123aeaa7f76f48.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of white fluffy snow at center more distant than that of sunglasses at right?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00f03ff0eee0b5a3.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.584, 0.719)?" }, { "from": "gpt", "value": "floral fabric bed at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/270a5f603597ef57.jpg", "conversations": [ { "from": "human", "value": "\nHow far is point (0.228, 0.564) from the camera?" }, { "from": "gpt", "value": "A distance of 34.25 meters exists between point (0.228, 0.564) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/797bb5c0b3ed9a72.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.456, 0.083) from camera?" }, { "from": "gpt", "value": "Point (0.456, 0.083) and camera are 46.41 feet apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4c7e2286daebff79.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from gray pinstripe suit at right to camera." }, { "from": "gpt", "value": "They are 1.23 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ff2ca09a9ac3b12.jpg", "conversations": [ { "from": "human", "value": "\nDoes glossy water at lower center appear on the left side of white matte swan at right?" }, { "from": "gpt", "value": "Indeed, glossy water at lower center is positioned on the left side of white matte swan at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a3f58b3bfc6ea2ac.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark brown suit at center have a lesser height compared to matte black suit at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ae713e46f97ad621.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.706, 0.666) or (0.109, 0.645)?" }, { "from": "gpt", "value": "Point (0.109, 0.645) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/96077ee64991c6c0.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the brown stone ruins at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.627, 0.689)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/caa0b6d42efddf28.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a blue long-sleeve shirt at center. Pinpoint a point to the blue long-sleeve shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.360, 0.652)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/68b8fea1ab3af0a0.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.497, 0.705) from camera?" }, { "from": "gpt", "value": "The distance of point (0.497, 0.705) from camera is 27.09 inches." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2964c645577b1c6c.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the distance between purple cotton shirt at left and matte white t-shirt at center?" }, { "from": "gpt", "value": "purple cotton shirt at left and matte white t-shirt at center are 13.96 inches apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/778801d7142153d5.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green leafy bush at lower left located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.278, 0.734)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e6b92156bbb0217.jpg", "conversations": [ { "from": "human", "value": "\nIs black metallic suv at center closer to camera compared to white plastic license plate at center?" }, { "from": "gpt", "value": "Yes, black metallic suv at center is in front of white plastic license plate at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3ffa06e95f0a5064.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.275, 0.558)?" }, { "from": "gpt", "value": "black cotton t-shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07c07a88187f43b0.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the party and want to take a photo that includes both the leather jacket at upper right and the dark gray jersey at center. Which object should you focus on first to ensure both are in the frame?" }, { "from": "gpt", "value": "The leather jacket at upper right is in front of the dark gray jersey at center, so you should focus on the leather jacket at upper right first to ensure both are in the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5314825379ffb5e0.jpg", "conversations": [ { "from": "human", "value": "\nYou are a drone operator who needs to fly a drone from the green turf field at center to the blue led display at upper right. What is the distance you need to cover?" }, { "from": "gpt", "value": "The distance between the green turf field at center and the blue led display at upper right is 36.41 meters, so you need to cover 36.41 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/002a6ceffbc2f037.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.942, 0.758) and point (0.170, 0.794), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.942, 0.758) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d8022029749c710.jpg", "conversations": [ { "from": "human", "value": "\nDoes plaid shirt at center appear under green sticky note at upper left?" }, { "from": "gpt", "value": "Indeed, plaid shirt at center is positioned under green sticky note at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc9a0e0c5a4f5f2a.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.590, 0.341) and point (0.545, 0.564), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.545, 0.564)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd4358d653645628.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if transparent glass car window at center is positioned above blue glossy wooden shoes at center?" }, { "from": "gpt", "value": "Yes, transparent glass car window at center is above blue glossy wooden shoes at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4fcfb1ae4a968bfb.jpg", "conversations": [ { "from": "human", "value": "\nYou are an audience member sitting in the front row of the theater. You notice the smooth skin person at center and the matte pink dress at center on stage. Which object is positioned to the left from your viewpoint?" }, { "from": "gpt", "value": "The smooth skin person at center is positioned to the left of the matte pink dress at center from the audience member viewpoint." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7c224f65da7f8953.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white fluffy cloud at center is smaller than white matte wing at upper left?" }, { "from": "gpt", "value": "No, white fluffy cloud at center is not smaller than white matte wing at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9400c49bbedd04e5.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of camouflage fabric uniform at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.399, 0.772)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7f2485169ab41e2c.jpg", "conversations": [ { "from": "human", "value": "\nHow far is knitted woolen hat at center from camera?" }, { "from": "gpt", "value": "The distance of knitted woolen hat at center from camera is 10.88 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a38dc2e56ce9bc55.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.357, 0.169) and point (0.818, 0.972), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.818, 0.972) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c0c32d195890705.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, green matte strip at center or green matte tape at center?" }, { "from": "gpt", "value": "Positioned to the left is green matte tape at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/478c0ece5c6bd5ba.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the amber glass vase at left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.265, 0.539)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf760d9cec236222.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a closeup shot of the light blue sweater at center and the fluffy cotton sweater at center. Your camera has a minimum focus distance of 8 inches. Can you focus on both sweaters at the same time?" }, { "from": "gpt", "value": "The distance between the light blue sweater at center and the fluffy cotton sweater at center is 8.72 inches. Since the minimum focus distance is 8 inches, the camera can focus on both sweaters simultaneously as the separation between them is within the required range." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60ff99dd6cdbd8bd.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and want to reach the point marked as point (0.892, 0.447). How far do you need to walk to get there?" }, { "from": "gpt", "value": "The distance of point (0.892, 0.447) from camera is 3.18 meters, so you need to walk 3.18 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/876bf9aed1c094b2.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.893, 0.516) lie in front of point (0.260, 0.900)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f66415d41e8bce4.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.614, 0.695) and camera?" }, { "from": "gpt", "value": "Point (0.614, 0.695) is 4.98 feet away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f781f271f8e35ef.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the asphalt road at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.649, 0.873)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00e9fe2360a545c3.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at upper right taller than gray brick chimney at left?" }, { "from": "gpt", "value": "Indeed, green leafy tree at upper right has a greater height compared to gray brick chimney at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f2c1eb609c77315d.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.271, 0.703)?" }, { "from": "gpt", "value": "yellow plaid shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d20e0c4a09c8488.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the concrete pillar at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.430, 0.502)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c75d407623ecfcd.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the edge of the bleachers, trying to capture the killer whales performing. You notice two points in the scene marked as point 1 and point 2. If point 1 is located at coordinate point (0.125, 0.002) and point 2 is at (0.047, 0.658), which point is closer to you?" }, { "from": "gpt", "value": "Point 1 at coordinate point (0.125, 0.002) is closer to you since it is further to the viewer than point 2 at (0.047, 0.658)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9ca61f583cd45b3.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of dark gray suit at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.340, 0.502)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6fe40e7f5443a84d.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person standing 5 meters away from the brown brick building at center. You need to place a package under the matte black awning at center. Can you reach the awning without moving closer than your current position?" }, { "from": "gpt", "value": "The brown brick building at center is 9.40 meters away from the matte black awning at center. Since you are currently 5 meters away from the building, you are still 4.4 meters away from the awning. Therefore, you need to move closer to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bfccd0af3acc1f44.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the United States Capitol building and want to take a photo of the white marble dome at center. If you look at the dome, where should you point your camera to capture it in the frame?" }, { "from": "gpt", "value": "You should point your camera towards the center area of the building, specifically at the coordinates approximately 0.597 along the horizontal axis and 0.650 along the vertical axis, where the white marble dome at center is located." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/24642d206ec1e415.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue tarp at lower left is taller than blue metallic crane at right?" }, { "from": "gpt", "value": "In fact, blue tarp at lower left may be shorter than blue metallic crane at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fd374d0622e3b207.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the green grassy at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.443, 0.817)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df92dfabef4b4748.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer positioned at the back of the arena. You want to take a photo that includes both the dark brown leather jacket at center and the green fabric shirt at center. Which one will appear larger in your photo?" }, { "from": "gpt", "value": "The dark brown leather jacket at center will appear larger in the photo because it is closer to the viewer than the green fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9bf83ddd001aca47.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the blue painted metal dock at lower center and want to jump into the green water at lower center. Is the dock wide enough to allow you to safely jump into the water without falling off the dock?" }, { "from": "gpt", "value": "The green water at lower center might be wider than blue painted metal dock at lower center, so the dock may not be wide enough to safely jump into the water. It is recommended to ensure stability before jumping." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a3e16e6949cb56a.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, white metal hospital bed at left or pink floral dress at center, stands shorter?" }, { "from": "gpt", "value": "Standing shorter between the two is white metal hospital bed at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d3e19c4f0de88ab5.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between pastel pink sky at upper center and green matte tree at center?" }, { "from": "gpt", "value": "The distance of pastel pink sky at upper center from green matte tree at center is 226.96 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/98633124d29ffe7c.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of smooth fabric dress at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.404, 0.694)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba059103eb70332b.jpg", "conversations": [ { "from": "human", "value": "\nYou are a passenger on the platform and want to board the train. You see the white glossy train at left and the light blue denim jacket at upper left. Which object is wider? Please answer based on their widths." }, { "from": "gpt", "value": "The white glossy train at left is wider than the light blue denim jacket at upper left according to their widths." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b95b0ffdcedc5c73.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.296, 0.686)?" }, { "from": "gpt", "value": "navy blue shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0972dcecabd4ac2d.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.668, 0.569) or point (0.485, 0.247)?" }, { "from": "gpt", "value": "Point (0.485, 0.247)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/87fe7a68c087247f.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.256, 0.884) and camera." }, { "from": "gpt", "value": "Point (0.256, 0.884) and camera are 6.44 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04d5f2305aae50b8.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of dark clothing crowd at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.849, 0.605)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b30d0352d050d12.jpg", "conversations": [ { "from": "human", "value": "\nCould you provide the distance between blue striped shirt at upper right and blue plastic bottle at right?" }, { "from": "gpt", "value": "blue striped shirt at upper right and blue plastic bottle at right are 26.81 inches apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ef8ad1311af338b.jpg", "conversations": [ { "from": "human", "value": "\nDoes black fur rabbit at center have a larger size compared to black furry rabbit at center?" }, { "from": "gpt", "value": "No, black fur rabbit at center is not bigger than black furry rabbit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e4843bfc41b18588.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a purple glossy tiles at center. Pinpoint a point to the purple glossy tiles at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.470, 0.428)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0232bbe560de087b.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, smooth wood canoe at lower left or smooth dark skin at center?" }, { "from": "gpt", "value": "smooth dark skin at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d464031fb19db9de.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between transparent glass window at upper center and transparent glass window at upper right?" }, { "from": "gpt", "value": "transparent glass window at upper center and transparent glass window at upper right are 89.94 centimeters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/56d244b4320f8c28.jpg", "conversations": [ { "from": "human", "value": "\nLocate the green grassy field at lower center in the image." }, { "from": "gpt", "value": "[(0.456, 0.373)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3fd9d96734c21f45.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, matte brown coffee pot at center or brown matte tea pot at center, stands shorter?" }, { "from": "gpt", "value": "brown matte tea pot at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f27af18ad6306b87.jpg", "conversations": [ { "from": "human", "value": "\nHow close is brown cotton shirt at right from gray fabric backpack at center-right?" }, { "from": "gpt", "value": "A distance of 1.35 meters exists between brown cotton shirt at right and gray fabric backpack at center-right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00255bea70504096.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.923, 0.448) closer to viewer compared to point (0.204, 0.720)?" }, { "from": "gpt", "value": "No, it is behind (0.204, 0.720)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ede1e0a6b7bf6bbe.jpg", "conversations": [ { "from": "human", "value": "\nYou are in a room with two points marked on the floor. The first point is at coordinate point(0.472, 0.548) and the second is at point(0.814, 0.620). If you are facing north, which point is closer to your current position?" }, { "from": "gpt", "value": "The point at coordinate point(0.472, 0.548) is behind point point(0.814, 0.620), so if you are facing north, the point at point(0.472, 0.548) would be behind you and farther away from your current position compared to point(0.814, 0.620). Therefore, the closer point is point(0.814, 0.620)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e373fa1c04a02323.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.896, 0.767) or point (0.178, 0.317)?" }, { "from": "gpt", "value": "Positioned in front is point (0.896, 0.767)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b0ecc0681ee798d.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer positioned in front of the vintage military aircraft. You want to take a closeup shot of the camouflage fabric uniform at right. How far should you stand from the uniform to capture it clearly?" }, { "from": "gpt", "value": "The camouflage fabric uniform at right is 6.28 meters from viewer. To capture it clearly, you should stand approximately 6.28 meters away from the uniform." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49eb7eb784d1e91f.jpg", "conversations": [ { "from": "human", "value": "\nYou are trying to determine if the matte black glasses at center can fit into a box that is the same width as the matte black beard at center. Based on the spatial relationship between them, can the glasses fit?" }, { "from": "gpt", "value": "The matte black glasses at center might be wider than the matte black beard at center, so they may not fit into a box sized for the beard." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a3d3f6099c2d4781.jpg", "conversations": [ { "from": "human", "value": "\nYou are a LEGO enthusiast examining the diorama. You notice the matte yellow figure at upper left and the brown matte teddy bear at center. Which of these two objects is taller?" }, { "from": "gpt", "value": "The matte yellow figure at upper left is taller than the brown matte teddy bear at center according to the description provided." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a05105d633263a8.jpg", "conversations": [ { "from": "human", "value": "\nBetween white matte snow at center and snowy water at center, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "white matte snow at center is more to the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/43fe7ec8039b00b6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if fluffy red fabric at center is positioned above matte black shorts at left?" }, { "from": "gpt", "value": "Actually, fluffy red fabric at center is below matte black shorts at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ac7c390149853277.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person who needs to place a 30 cm wide package between the white glossy mantle at upper center and the wooden frame at upper center. Can you fit the package in the space between them?" }, { "from": "gpt", "value": "The distance between the white glossy mantle at upper center and the wooden frame at upper center is 28.99 centimeters, so the 30 cm wide package cannot fit in the space between them." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/326bb3499bad4f69.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.375, 0.583) or (0.863, 0.323)?" }, { "from": "gpt", "value": "Positioned behind is point (0.863, 0.323)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/43046f38acce6da1.jpg", "conversations": [ { "from": "human", "value": "\nYou are a visitor approaching the entrance of the Peter J. Shields Library. You notice a pink fabric shirt at lower left and a light brown leather backpack at right. Which object is closer to you as you stand at the entrance?" }, { "from": "gpt", "value": "The pink fabric shirt at lower left is closer to you because it is in front of the light brown leather backpack at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1943cfc915c6ef7.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the right, orange fabric skirt at left or denim shorts at center?" }, { "from": "gpt", "value": "denim shorts at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/275ad2560e3ccdd5.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of stone bridge at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.686, 0.409)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/66e7400b77d85888.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of gray striped shirt at left. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.108, 0.673)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d8aedaaa43e13200.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.861, 0.341) positioned in front of point (0.935, 0.419)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/361864a89f50d6c6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if camouflage helmet at center is shorter than white matte cap at center?" }, { "from": "gpt", "value": "Indeed, camouflage helmet at center has a lesser height compared to white matte cap at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3952012271b9039a.jpg", "conversations": [ { "from": "human", "value": "\nLocate the green leafy tree at upper left in the image." }, { "from": "gpt", "value": "[(0.423, 0.277)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f72970cb23511be8.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the white sand at lower center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.778, 0.878)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c45cdb130badc176.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the white satin dress at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.369, 0.639)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1aa709d72e93d78.jpg", "conversations": [ { "from": "human", "value": "\nWhere is blue metallic bus at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.532, 0.447)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bbe2a7fffd004be1.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.223, 0.653)?" }, { "from": "gpt", "value": "matte black sunglasses at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/349a0c1cfc3174bc.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to black lace top at center? Please provide its 2D coordinates.Where can I find black lace top at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.418, 0.670)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4c96419678e5489e.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden table at center above white matte baseball cap at upper center?" }, { "from": "gpt", "value": "No, wooden table at center is not above white matte baseball cap at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/078e757652d705ee.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if orange tarp tent at center is positioned to the left of brown fabric tent at center?" }, { "from": "gpt", "value": "Indeed, orange tarp tent at center is positioned on the left side of brown fabric tent at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd2ade404fd91616.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green reflective water at center is positioned to the left of smooth white birch tree at center?" }, { "from": "gpt", "value": "In fact, green reflective water at center is to the right of smooth white birch tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec2be962a889c2ac.jpg", "conversations": [ { "from": "human", "value": "\nBetween matte white shirt at left and white shirt at center, which one is positioned lower?" }, { "from": "gpt", "value": "Positioned lower is matte white shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c081bda69b7725c8.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte gray suit at center appear on the left side of black glossy laptop at center?" }, { "from": "gpt", "value": "Yes, matte gray suit at center is to the left of black glossy laptop at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/52e18ef7212d7f47.jpg", "conversations": [ { "from": "human", "value": "\nIs dark green leafy tree at left positioned in front of dark green textured tree at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7220f88ca89ec456.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.506, 0.314) and point (0.996, 0.456), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.506, 0.314) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/39650411cf91b9a6.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, desert shrubs at center or rustic stone hole at center?" }, { "from": "gpt", "value": "Standing shorter between the two is rustic stone hole at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44329b2df38d0aaa.jpg", "conversations": [ { "from": "human", "value": "\nHow close is point (0.820, 0.436) from camera?" }, { "from": "gpt", "value": "Point (0.820, 0.436) is 6.80 feet from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c04cf7cb53164b23.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, green fabric tank top at center or green fabric tank top at left, stands taller?" }, { "from": "gpt", "value": "green fabric tank top at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fa2be7a9c82e158c.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.876, 0.373) in front of point (0.470, 0.494)?" }, { "from": "gpt", "value": "Yes, point (0.876, 0.373) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/39255ac12439d51d.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, green leafy tree at left or brown textured palm tree at upper center?" }, { "from": "gpt", "value": "Positioned to the right is brown textured palm tree at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/459296f3855c3815.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a candid shot of a person leaning against a blue door frame on the left side of the frame. You want to ensure the subject is in focus. If your camera has a minimum focusing distance of 20 inches, will you be able to focus on the point at point (0.511, 0.958)?" }, { "from": "gpt", "value": "The distance between the point (0.511, 0.958) and the camera is 20.39 inches. Since the minimum focusing distance is 20 inches, the camera can focus on the point as it is just beyond the minimum requirement." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/24c35b3c9f204267.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.712, 0.959) or point (0.033, 0.042)?" }, { "from": "gpt", "value": "Point (0.712, 0.959) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/48d4bf8fcffc5546.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.628, 0.211) or point (0.796, 0.459)?" }, { "from": "gpt", "value": "Point (0.796, 0.459)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/331e845c67855e06.jpg", "conversations": [ { "from": "human", "value": "\nLocate the plaid fabric tablecloth at center in the image." }, { "from": "gpt", "value": "[(0.184, 0.863)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/493da889de3fa451.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of point (0.304, 0.594)?" }, { "from": "gpt", "value": "Point (0.304, 0.594) is 7.18 feet away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0fb25e72a6da1dcf.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, dark gray fabric pants at lower left or white cotton shirt at center?" }, { "from": "gpt", "value": "white cotton shirt at center is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fae2f7b4f9f13a1b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if soft plush teddy bear at center is bigger than transparent glass window at upper left?" }, { "from": "gpt", "value": "Indeed, soft plush teddy bear at center has a larger size compared to transparent glass window at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04d50343b1a473df.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black pants at left thinner than green matte climbing suit at center?" }, { "from": "gpt", "value": "No, matte black pants at left is not thinner than green matte climbing suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7cbaa8dc9514b65.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.251, 0.661) or (0.851, 0.887)?" }, { "from": "gpt", "value": "Point (0.251, 0.661) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b9ddbb48756adb2.jpg", "conversations": [ { "from": "human", "value": "\nYou are a customer at the market and want to pick up an item from the table. You notice two points on the table marked as point 1 and point 2. Point 1 is at coordinates (0.131, 0.278) and point 2 is at (0.028, 0.086). If you were to reach for the item at point 1 first, would you have to extend your arm more compared to reaching for point 2?" }, { "from": "gpt", "value": "Since point 1 is closer to the camera than point 2, reaching for point 1 would require less arm extension compared to point 2. Therefore, you would not have to extend your arm more for point 1 than point 2." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03b71eabedd71da1.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.510, 0.659) and camera." }, { "from": "gpt", "value": "Point (0.510, 0.659) and camera are 2.15 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f6ed47ed875b9bb.jpg", "conversations": [ { "from": "human", "value": "\nPoint to white glossy boat at left.Point to the white glossy boat at left in the image." }, { "from": "gpt", "value": "[(0.122, 0.436)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d7793efaac9ca3a.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of matte red jersey at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.929, 0.359)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/139b3e2764326140.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.251, 0.316) more distant than point (0.251, 0.767)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f178b8eb692ed46.jpg", "conversations": [ { "from": "human", "value": "\nLocate all light oak wood door at center in the image." }, { "from": "gpt", "value": "[(0.599, 0.409)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1b6a955ea907a18.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the white plastic bag at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.626, 0.541)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49a564221326d0c8.jpg", "conversations": [ { "from": "human", "value": "\nLocate the green water at center in the image." }, { "from": "gpt", "value": "[(0.483, 0.578)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e92159beb4247ec.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the white frothy water at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.365, 0.266)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f727f9a1125bb5f.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.464, 0.798)?" }, { "from": "gpt", "value": "white plastic car at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/930c8cc193cfe323.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.866, 0.325)?" }, { "from": "gpt", "value": "wooden cabin at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/699e1d37dbeb7adf.jpg", "conversations": [ { "from": "human", "value": "\nPoint to green rock mountain at center.Point to the green rock mountain at center in the image." }, { "from": "gpt", "value": "[(0.396, 0.511)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e05f117015543c0f.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.216, 0.519)?" }, { "from": "gpt", "value": "green matte tree at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0c6dcd7300299d4.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at center is positioned to the right of dark gray fluffy cloud at upper left?" }, { "from": "gpt", "value": "Yes, green leafy tree at center is to the right of dark gray fluffy cloud at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/27da79c938f45f1a.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.747, 0.617) in front of point (0.756, 0.702)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/62b8634c179e6b3e.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the rocky shoreline and want to walk to the green leafy trees at center from the blue water at lower left. How far do you need to walk?" }, { "from": "gpt", "value": "The distance between the blue water at lower left and the green leafy trees at center is 42.52 meters, so you need to walk 42.52 meters to reach them." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf15b4b2c93c7f44.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the dark blue jacket at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.158, 0.522)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02173feb65039ace.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up a photo shoot in a room with a rocky landscape backdrop. You have two outfits to place on mannequins for a display. The outfits are the white striped polo shirt at upper right and the matte floral dress at lower left. Which outfit should you choose if you want the larger one to be placed on the mannequin closer to the camera?" }, { "from": "gpt", "value": "The white striped polo shirt at upper right is bigger than the matte floral dress at lower left, so you should place the white striped polo shirt at upper right on the mannequin closer to the camera to make it appear larger in the photo." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f09d1f9480da13a3.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of point (0.713, 0.255)?" }, { "from": "gpt", "value": "Point (0.713, 0.255) and camera are 9.20 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c694d67dadde5b6d.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, black matte hijab at center or green fabric jacket at center?" }, { "from": "gpt", "value": "With less height is green fabric jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/48babff324a07767.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, blue fabric shirt at upper right or dark blue jeans at center?" }, { "from": "gpt", "value": "dark blue jeans at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/62476e98245a64cc.jpg", "conversations": [ { "from": "human", "value": "\nHow close is reflective yellow vest at center from camera?" }, { "from": "gpt", "value": "A distance of 6.27 meters exists between reflective yellow vest at center and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16f397b1b3fab669.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black helmet at upper center appear over camouflage fabric helmet at center?" }, { "from": "gpt", "value": "Correct, matte black helmet at upper center is located above camouflage fabric helmet at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ee3c73047582789.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of blue water at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.516, 0.806)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d25ed8fca0122032.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black plastic keyboard at center-right is positioned to the right of matte black monitor at center?" }, { "from": "gpt", "value": "Yes, black plastic keyboard at center-right is to the right of matte black monitor at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7cb5c26120dbc6bb.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.301, 0.689) or (0.158, 0.634)?" }, { "from": "gpt", "value": "Positioned in front is point (0.301, 0.689)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d36b21f963f5615.jpg", "conversations": [ { "from": "human", "value": "\nDoes white cotton shirt at center appear under rubberized red ring at upper center?" }, { "from": "gpt", "value": "Correct, white cotton shirt at center is located below rubberized red ring at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1527d418ed01cceb.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, green fabric jacket at center or matte green jacket at center?" }, { "from": "gpt", "value": "Positioned to the right is matte green jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f1a566b27cb9ffa.jpg", "conversations": [ { "from": "human", "value": "\nYou are an architect analyzing the spatial relationship between the orange brick building at lower left and the white fluffy cloud at upper left. Which object is positioned closer to the viewer?" }, { "from": "gpt", "value": "The white fluffy cloud at upper left is closer to the viewer because the orange brick building at lower left is behind it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/924796890de71d25.jpg", "conversations": [ { "from": "human", "value": "\nDoes striped tie at center have a smaller size compared to black striped tie at center?" }, { "from": "gpt", "value": "No, striped tie at center is not smaller than black striped tie at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/72723b2c484bd91a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green matte tree at upper center is positioned below white plastic boat at center?" }, { "from": "gpt", "value": "Actually, green matte tree at upper center is above white plastic boat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/72f63b9a66e39984.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.896, 0.633) or point (0.401, 0.573)?" }, { "from": "gpt", "value": "Positioned behind is point (0.896, 0.633)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe14b4a9d54380e2.jpg", "conversations": [ { "from": "human", "value": "\nWhere is matte red hoodie at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.465, 0.634)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4acac65c2c51c137.jpg", "conversations": [ { "from": "human", "value": "\nYou are a customer arriving at the Taco Bell restaurant and see both the shiny blue car at center and the metallic blue sedan at center in the parking lot. Which vehicle is closer to the entrance of the restaurant?" }, { "from": "gpt", "value": "The shiny blue car at center is closer to the entrance of the restaurant because it is in front of the metallic blue sedan at center, which is further away." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6558670d9bddbee.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, white cotton shirt at center or matte blue polo shirt at right, stands taller?" }, { "from": "gpt", "value": "matte blue polo shirt at right is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70d55d7eb1efc448.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker carrying a backpack and want to walk along the brown dirt path at center while avoiding the white fluffy dog at lower left. Can you walk on the path without stepping on the dog?" }, { "from": "gpt", "value": "The brown dirt path at center might be wider than white fluffy dog at lower left, so there is a possibility to walk on the path without stepping on the dog." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/abbf41d612f707fd.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.468, 0.277) or (0.355, 0.433)?" }, { "from": "gpt", "value": "Point (0.355, 0.433) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b13c5d9f75e23bc.jpg", "conversations": [ { "from": "human", "value": "\nBetween beige stone palace at center and denim jacket at center, which one has more height?" }, { "from": "gpt", "value": "beige stone palace at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bfa3555520f3c076.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.789, 0.412) less distant than point (0.147, 0.609)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e68bb35920fd2ba6.jpg", "conversations": [ { "from": "human", "value": "\nYou are a visitor at the zoo and you see the shiny black crocodile at center and the khaki cotton shirt at upper center. Which object is positioned higher in the image?" }, { "from": "gpt", "value": "The khaki cotton shirt at upper center is positioned higher in the image than the shiny black crocodile at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05b2f53f765cbee6.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of black matte shirt at center?" }, { "from": "gpt", "value": "The distance of black matte shirt at center from camera is 27.14 inches." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/696898a8fd928278.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green grass at lower center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.464, 0.797)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/055303adf09ce477.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between green glossy car at center and camera." }, { "from": "gpt", "value": "green glossy car at center is 8.52 feet away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3eaf787d59ca33b7.jpg", "conversations": [ { "from": "human", "value": "\nBetween blue satin shirt at center and striped tie at center, which one has less height?" }, { "from": "gpt", "value": "striped tie at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf040acfa04bc441.jpg", "conversations": [ { "from": "human", "value": "\nWhere is wooden lattice at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.343, 0.433)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7cc617a9a1d96b76.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the edge of the waterfall and see the greenish water at center and the gray rough stone at center. Which one takes up more space in the scene?" }, { "from": "gpt", "value": "The greenish water at center is bigger than the gray rough stone at center, so it takes up more space in the scene." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4015b0f9718e306a.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer positioned at the white matte shirt at center. You want to take a photo of the man wearing a light gray tshirt with a star design and red shorts who is standing on the left side. How far do you need to move to get a clear shot of him?" }, { "from": "gpt", "value": "The man wearing a light gray tshirt with a star design and red shorts on the left side is 16.81 feet away from the white matte shirt at center. To capture a clear photo, you would need to move closer or adjust your camera lens to accommodate the distance of 16.81 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9635c76e88bb29e8.jpg", "conversations": [ { "from": "human", "value": "\nBetween matte red sculpture at center and matte leather pillow at lower left, which one has more height?" }, { "from": "gpt", "value": "matte red sculpture at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b2a9818ede78f834.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the metallic gray bench at lower center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.317, 0.775)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f6ac1484b750e99.jpg", "conversations": [ { "from": "human", "value": "\nBetween green wrought iron gate at center and brick pavement at lower left, which one has more height?" }, { "from": "gpt", "value": "green wrought iron gate at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b9bd67ea35164a6.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the brown sandy beach at lower center and want to reach the clear water at lower center. Which direction should you move to get to the water?" }, { "from": "gpt", "value": "The brown sandy beach at lower center is positioned under the clear water at lower center, so you should move upward to reach the clear water at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a227ed22b45d8a1d.jpg", "conversations": [ { "from": "human", "value": "\nDoes green glass spire at center appear on the left side of glassy steel skyscraper at upper left?" }, { "from": "gpt", "value": "In fact, green glass spire at center is to the right of glassy steel skyscraper at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d93011042c539325.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue cotton shirt at center is positioned below matte red coat at center?" }, { "from": "gpt", "value": "Correct, blue cotton shirt at center is located below matte red coat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/376f7a9db0de8955.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the blue uniform at lower right? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.904, 0.828)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a37b3345d27283d9.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black stroller at center shorter than white fabric bag at center?" }, { "from": "gpt", "value": "Yes, matte black stroller at center is shorter than white fabric bag at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f74fbc702c9cd5ad.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer planning to capture the entire view of the light brown bark tree at left and the smooth bark tree at center in a single frame. Based on their sizes in the image, which tree should you focus on to ensure both fit without cropping?" }, { "from": "gpt", "value": "The light brown bark tree at left occupies less space than the smooth bark tree at center, so focusing on the smooth bark tree at center will help ensure both trees fit in the frame since it takes up more space and can serve as the main subject while the smaller one remains visible." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6798087264d9e5dc.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green leafy tree at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.448, 0.244)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5119373128ee603d.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of matte red shirt at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.588, 0.603)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3274d0b9a72586ca.jpg", "conversations": [ { "from": "human", "value": "\nIs brown rough dirt track at lower right to the right of green matte tree at center from the viewer's perspective?" }, { "from": "gpt", "value": "Yes, brown rough dirt track at lower right is to the right of green matte tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b46fcaed91194da.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of green grassy at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.523, 0.792)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c2ebd083f02f525.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, black matte t-shirt at center or striped cotton shirt at left?" }, { "from": "gpt", "value": "striped cotton shirt at left is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/744dbb8e55674335.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black fabric jacket at upper left is positioned to the left of black matte jacket at left?" }, { "from": "gpt", "value": "No, black fabric jacket at upper left is not to the left of black matte jacket at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9319ab2d152ebba.jpg", "conversations": [ { "from": "human", "value": "\nYou are setting up a charging station for two smartphones. You have a black matte smartphone at right and a slate gray metallic smartphone at center. According to the scene, which smartphone is positioned higher?" }, { "from": "gpt", "value": "The black matte smartphone at right is located above the slate gray metallic smartphone at center, so it is positioned higher." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d982501e74fb9a6b.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.541, 0.773) or (0.657, 0.652)?" }, { "from": "gpt", "value": "Point (0.541, 0.773)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b68e20e549f1fe9e.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.351, 0.627) closer to camera compared to point (0.269, 0.439)?" }, { "from": "gpt", "value": "Yes, point (0.351, 0.627) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c4b25cfb732a15a.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point with coordinates point (0.439, 0.641) and want to walk towards the point with coordinates point (0.544, 0.969). According to the scene description, which direction should you move to reach your destination?" }, { "from": "gpt", "value": "You should move forward because point (0.544, 0.969) is in front of point (0.439, 0.641)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c83eae15009d978f.jpg", "conversations": [ { "from": "human", "value": "\nPoint to green leafy tree at left.Point to the green leafy tree at left in the image." }, { "from": "gpt", "value": "[(0.169, 0.747)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7bc3c5da78d7f0f.jpg", "conversations": [ { "from": "human", "value": "\nWhat is at (0.522, 0.759)?" }, { "from": "gpt", "value": "clear water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a99f9179831cdbeb.jpg", "conversations": [ { "from": "human", "value": "\nBetween white matte snowboard at center and black matte boot at lower center, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "From the viewer's perspective, white matte snowboard at center appears more on the right side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fba9b5fc33dea642.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked as point (0.907, 0.000) in the image. You want to pick up the watercolor palette on the right. How far is the palette from your current position?" }, { "from": "gpt", "value": "The point (0.907, 0.000) is 29.20 inches away from the viewer, so the watercolor palette on the right is 29.20 inches away from your current position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fbadc53ae18e77e6.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the edge of the gathering and want to hand a drink to the person wearing the green matte shirt at center. How far do you need to walk to reach them?" }, { "from": "gpt", "value": "The green matte shirt at center is 3.37 meters away from the viewer, so you need to walk approximately 3.37 meters to reach them." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23fdf9a44e493dab.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.630, 0.570) from camera?" }, { "from": "gpt", "value": "The distance of point (0.630, 0.570) from camera is 290.18 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2335f0c681dcb68a.jpg", "conversations": [ { "from": "human", "value": "\nBetween black fleece jacket at right and knitted sweater at left, which one has more height?" }, { "from": "gpt", "value": "With more height is black fleece jacket at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/467b2f25d5a40616.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the office and want to reach a specific point marked at coordinates point (0.000, 0.745). How far is this point from you?" }, { "from": "gpt", "value": "The distance of point (0.000, 0.745) from the viewer is 2.58 meters, so the point is 2.58 meters away." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4d0c8edae16fd5d6.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.567, 0.122) positioned behind point (0.881, 0.498)?" }, { "from": "gpt", "value": "No, (0.567, 0.122) is in front of (0.881, 0.498)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3743c76c89e652ae.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.497, 0.630) or (0.339, 0.773)?" }, { "from": "gpt", "value": "Point (0.339, 0.773) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/420f2726408d37fd.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the smooth bark tree trunk at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.939, 0.264)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/afccce6ec83d0cf6.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.516, 0.819) or point (0.740, 0.178)?" }, { "from": "gpt", "value": "Point (0.516, 0.819)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d10d8228f84cd3d5.jpg", "conversations": [ { "from": "human", "value": "\nYou are a tour guide explaining the coastal town to visitors. You mention the blue water at center and the white glossy boat at center. How far apart are these two landmarks?" }, { "from": "gpt", "value": "The blue water at center is 41.72 meters from the white glossy boat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/599c121790a37a60.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any knitted wool scarf at center in the image." }, { "from": "gpt", "value": "[(0.362, 0.480)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5a2102ff0f49894.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.786, 0.295) and camera?" }, { "from": "gpt", "value": "Point (0.786, 0.295) is 1.26 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c2ee03aabd2b6435.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.960, 0.103) and point (0.656, 0.441), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.656, 0.441) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a5935469b424752.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to decide which shirt to wear for a photoshoot. The white linen shirt at left is more breathable than the white textured shirt at left. Which shirt should you choose if you want something lighter and cooler?" }, { "from": "gpt", "value": "The white linen shirt at left is thinner than the white textured shirt at left, so it is lighter and cooler, making it the better choice for the photoshoot." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1bba2f07a78b9ea6.jpg", "conversations": [ { "from": "human", "value": "\nLocate all stained glass balcony at upper right in the image." }, { "from": "gpt", "value": "[(0.720, 0.322)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1895afedf31d474e.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, green leafy tree at center or green leafy tree at left?" }, { "from": "gpt", "value": "Positioned lower is green leafy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f35293e0df75094b.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between white fur dog at left and camera?" }, { "from": "gpt", "value": "They are 53.33 centimeters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ab6ebecaa4b2f97.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from point (0.029, 0.069) to camera." }, { "from": "gpt", "value": "5.16 feet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eee42b4d87c54fa9.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.113, 0.797)?" }, { "from": "gpt", "value": "denim jacket at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3df5425e7638de21.jpg", "conversations": [ { "from": "human", "value": "\nLocate the floral dress at center in the image." }, { "from": "gpt", "value": "[(0.278, 0.412)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b3020cc0bae5eaf0.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black jacket at center is wider than purple matte business suit at upper center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1eec21d8ff6acc3.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the black matte hair at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.820, 0.606)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1816f47770706f54.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of a laundromat and need to reach the brushed metal washing machine at center. How far away is it from your current position?" }, { "from": "gpt", "value": "The brushed metal washing machine at center is 2.36 meters away from your current position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bcfa179aee312ac5.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.899, 0.767) or (0.546, 0.056)?" }, { "from": "gpt", "value": "The point (0.546, 0.056) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/755843bc101aefe9.jpg", "conversations": [ { "from": "human", "value": "\nYou are taking a photo of the edcamp poster and notice two points on the poster. One is at coordinate point (0.320, 0.945) and the other is at point (0.010, 0.905). Which point is closer to the bottom edge of the poster?" }, { "from": "gpt", "value": "Point (0.010, 0.905) is closer to the bottom edge of the poster because it has a smaller y coordinate value compared to point (0.320, 0.945)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f96b826779bee146.jpg", "conversations": [ { "from": "human", "value": "\nHow far is green textured bikini top at center from clear plastic goggles at center?" }, { "from": "gpt", "value": "The distance of green textured bikini top at center from clear plastic goggles at center is 1.03 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60716dc5f7f190c3.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.136, 0.809) and camera." }, { "from": "gpt", "value": "Point (0.136, 0.809) and camera are 34.66 inches apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/141f1e37fc34c22e.jpg", "conversations": [ { "from": "human", "value": "\nLocate the pink glossy text at upper center in the image." }, { "from": "gpt", "value": "[(0.664, 0.483)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/189e3c6facca854c.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between dark blue uniform at center and camera." }, { "from": "gpt", "value": "dark blue uniform at center is 1.55 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a023fb10ea9e1db.jpg", "conversations": [ { "from": "human", "value": "\nYou are an architect analyzing the spatial relationships in the scene. Based on the image, which of the two brick churches, the brick church at center or the matte brick church at upper center, appears closer to the viewer?" }, { "from": "gpt", "value": "The brick church at center appears closer to the viewer because it is taller than the matte brick church at upper center, indicating it is positioned in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dca62b79c15a639c.jpg", "conversations": [ { "from": "human", "value": "\nIs tan wool suit at right bigger than black satin suit at center?" }, { "from": "gpt", "value": "No, tan wool suit at right is not bigger than black satin suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d63236e9946b1738.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of yellow plastic tape at lower center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.347, 0.844)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7366b0cdf4d786e6.jpg", "conversations": [ { "from": "human", "value": "\nYou are a guest at this event and need to place a small gift on the table without blocking the view of the text on the tablecloth. Considering the size of the black glossy table at center and the graywoollybeard at center, where should you place the gift?" }, { "from": "gpt", "value": "The black glossy table at center is bigger than the graywoollybeard at center, so placing the gift on the black glossy table at center would ensure it doesn" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc870f258efed292.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between point (0.864, 0.216) and camera?" }, { "from": "gpt", "value": "38.01 inches" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0fe114888601c199.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of black matte shirt at left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.204, 0.670)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7793a282aa9bb33a.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.429, 0.981) in front of point (0.787, 0.783)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.787, 0.783)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e8f9d5fdf182eda.jpg", "conversations": [ { "from": "human", "value": "\nDoes clear glass window at center appear on the right side of yellow painted wood sign at center?" }, { "from": "gpt", "value": "Correct, you'll find clear glass window at center to the right of yellow painted wood sign at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/afbb8c4d84c6be59.jpg", "conversations": [ { "from": "human", "value": "\nYou are a sports analyst watching the game. You notice two items in the image, the matte silver helmet at center and the black striped shirt at upper center. Which of these two items appears narrower in the image?" }, { "from": "gpt", "value": "The matte silver helmet at center appears narrower than the black striped shirt at upper center because its width is less than the shirt." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d4af39a603add44.jpg", "conversations": [ { "from": "human", "value": "\nPoint to pinstriped suit at center.Point to the pinstriped suit at center in the image." }, { "from": "gpt", "value": "[(0.080, 0.434)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ad177c746b7528ba.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.694, 0.427) or (0.566, 0.517)?" }, { "from": "gpt", "value": "Point (0.694, 0.427) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f0affc87953a1b6c.jpg", "conversations": [ { "from": "human", "value": "\nIs glossy plastic headlight at center wider than satin white sedan at center?" }, { "from": "gpt", "value": "No, glossy plastic headlight at center is not wider than satin white sedan at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cce0a8871bc27881.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the greenish-blue water at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.458, 0.764)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bb48d21237b9474f.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the white matte shorts at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.668, 0.580)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e59eabff1fcdfcb3.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, brown wooden stool at lower center or white fluffy dog at center?" }, { "from": "gpt", "value": "Positioned higher is white fluffy dog at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6a1621372e29ed90.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a photo of the dark blue jeans at center and the dark gray fabric jacket at center. Since you want to ensure both are in focus, you need to know which one is taller. Can you tell me which one is taller?" }, { "from": "gpt", "value": "The dark blue jeans at center is taller than the dark gray fabric jacket at center according to the description." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3fcc0a69475de131.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.129, 0.611) and point (0.478, 0.438), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.129, 0.611) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/797cef93592a920e.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte dress at lower left wider than white matte shirt at upper center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f15546992566c42.jpg", "conversations": [ { "from": "human", "value": "\nHow far apart are brown furry animal at center and teal fleece jacket at center?" }, { "from": "gpt", "value": "brown furry animal at center is 50.40 centimeters away from teal fleece jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/21a0fbcfefef6d7c.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of denim jacket at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.443, 0.720)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c6d09a0f810b34e9.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of white sand man at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.351, 0.597)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/941c52238001cf05.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of concrete bridge at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.740, 0.512)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/64620c768af87510.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.623, 0.827) from camera?" }, { "from": "gpt", "value": "Point (0.623, 0.827) is 18.30 feet from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c8f802ed29002d71.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of golden fur dog at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.281, 0.713)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23f4a29b45c57e47.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.915, 0.362) or (0.186, 0.928)?" }, { "from": "gpt", "value": "Point (0.915, 0.362) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce681947237ff79b.jpg", "conversations": [ { "from": "human", "value": "\nIs white/kimono/jiu-jitsu gi at center above white textured kimono at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/62b50c0d5c29a7d2.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte brown vest at left lie behind gray fuzzy beard at center?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2bd58665da092413.jpg", "conversations": [ { "from": "human", "value": "\nIs green grassy at center closer to the viewer compared to black feathered ostrich at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de1e0404f99cb194.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a matte gray jacket at right. Pinpoint a point to the matte gray jacket at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.815, 0.636)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d76f2dc0b725db5.jpg", "conversations": [ { "from": "human", "value": "\nIs red rubber fish at right positioned before white cotton shirt at center?" }, { "from": "gpt", "value": "Yes, it is in front of white cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a366cb34cdd0cf5c.jpg", "conversations": [ { "from": "human", "value": "\nYou are a sailor on the white matte ferry at right, and you want to know the distance between your ferry and the blue water at center to ensure safe navigation. What is the distance between them?" }, { "from": "gpt", "value": "The blue water at center is 14.95 meters from the white matte ferry at right, so the distance between them is 14.95 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36beb29cf6523440.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.897, 0.764) and camera?" }, { "from": "gpt", "value": "They are 107.55 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c1eaf5c8f8d5347a.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the sunglasses at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.773, 0.628)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8dcec856c81be066.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the black metallic truck at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.888, 0.512)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ad6605d580c720f.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the black matte blazer at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.698, 0.627)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/32de6347a8b47aad.jpg", "conversations": [ { "from": "human", "value": "\nIs orange fabric figure at center positioned in front of yellow cotton shirt at center?" }, { "from": "gpt", "value": "Yes, orange fabric figure at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1341e0694194183.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing 30 inches away from the pink matte shirt at center. You want to take a photo of the matte black sunglasses at upper left without moving your position. Can you reach the sunglasses with your camera lens?" }, { "from": "gpt", "value": "The pink matte shirt at center is 28.07 inches away from the matte black sunglasses at upper left. Since you are 30 inches away from the pink matte shirt at center, the matte black sunglasses at upper left would be approximately 30 inches minus 28.07 inches equals 1.93 inches away from you. Therefore, you can reach the matte black sunglasses at upper left with your camera lens as they are within your current position range." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf4ae96f39ab10fb.jpg", "conversations": [ { "from": "human", "value": "\nDoes wooden at center appear on the right side of gray suit at center?" }, { "from": "gpt", "value": "Yes, wooden at center is to the right of gray suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ed269d311a197e0.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.794, 0.764) and point (0.661, 0.662), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.661, 0.662) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/778e48cfa898232e.jpg", "conversations": [ { "from": "human", "value": "\nBetween white matte shirt at center and matte white head at lower center, which one has less height?" }, { "from": "gpt", "value": "matte white head at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/216ab92aaba3a621.jpg", "conversations": [ { "from": "human", "value": "\nIs rough brown shirt at center positioned at the back of brown wooden chair at left?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6637863cbd153ee1.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.572, 0.447) less distant than point (0.917, 0.411)?" }, { "from": "gpt", "value": "Yes, point (0.572, 0.447) is in front of point (0.917, 0.411)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c54b991453551ee7.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.381, 0.627) and point (0.612, 0.731), which one is positioned in front?" }, { "from": "gpt", "value": "Positioned in front is point (0.612, 0.731)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ee7c30484cdc2e29.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.522, 0.463) or (0.425, 0.830)?" }, { "from": "gpt", "value": "The point (0.522, 0.463) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/51399de3fea2a0b2.jpg", "conversations": [ { "from": "human", "value": "\nYou are a tour guide leading a group through the art gallery. You need to move from the navy blue blazer at right to the matte black frame at upper left. Is the distance between them sufficient to accommodate a 2.5 meter long tour guide pole you are holding?" }, { "from": "gpt", "value": "The navy blue blazer at right and matte black frame at upper left are 2.27 meters apart, which is shorter than the 2.5 meter tour guide pole. Therefore, the pole cannot fit between them without overlapping." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/10cdc229466a01e0.jpg", "conversations": [ { "from": "human", "value": "\nIs black metal fence at center bigger than white matte tank top at center?" }, { "from": "gpt", "value": "Yes, black metal fence at center is bigger than white matte tank top at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f212549c5a6bb487.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.519, 0.050) or (0.216, 0.431)?" }, { "from": "gpt", "value": "The point (0.216, 0.431) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5cfe3f5e70fc703a.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the winter sports event. You want to take a photo of the white glossy snowboarder at center without any obstructions. Is the metallic gray building at upper center blocking your view of the snowboarder?" }, { "from": "gpt", "value": "The white glossy snowboarder at center is behind the metallic gray building at upper center, so the building is blocking the view of the snowboarder." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d236be9da5eeec69.jpg", "conversations": [ { "from": "human", "value": "\nIs black leather armchair at lower left thinner than black leather chair at lower left?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1fd6050e791926ab.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the cobblestone street and want to take a photo of the green leafy tree at left. If your camera has a maximum focus range of 15 feet, will you need to move closer to the tree to get a clear shot?" }, { "from": "gpt", "value": "The green leafy tree at left is 16.98 feet away from you, which exceeds your camera maximum focus range of 15 feet. You need to move closer to the tree to get a clear shot." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/45d51e11d4ff1a85.jpg", "conversations": [ { "from": "human", "value": "\nWhere is white smooth garage door at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.814, 0.588)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b1be6ae2a672ad5.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the transparent glass door at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.404, 0.336)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ad8e6f6a85b8974.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.371, 0.233) in front of point (0.069, 0.463)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f77574216665add.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position in the urban railway scene. There is a point marked at coordinates point (0.335, 0.431). How far is this point from your current position?" }, { "from": "gpt", "value": "The point (0.335, 0.431) is 105.10 meters away from your current position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/41e09870f3ce428e.jpg", "conversations": [ { "from": "human", "value": "\nDescribe the object at (0.233, 0.511)." }, { "from": "gpt", "value": "matte black shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/929b5339d8b6f24c.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.676, 0.600)?" }, { "from": "gpt", "value": "silhouette fabric jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0cf2efc4ec4a2a7.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.486, 0.281) and point (0.742, 0.977), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.742, 0.977) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5a6aa243807aaa0.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, plaid shirt at lower right or gray hair at center?" }, { "from": "gpt", "value": "plaid shirt at lower right is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/765cf3d67077f2ad.jpg", "conversations": [ { "from": "human", "value": "\nBetween white matte church at center and purple matte flower at right, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "white matte church at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f964ccf047af528a.jpg", "conversations": [ { "from": "human", "value": "\nLocate all velvet black coat at center in the image." }, { "from": "gpt", "value": "[(0.157, 0.655)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7dad71e31157ae25.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between matte pink shirt at left and camera?" }, { "from": "gpt", "value": "They are 7.78 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b58e8a84fc67dcaf.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, plaid cotton dress at left or green plaid dress at left?" }, { "from": "gpt", "value": "With less height is green plaid dress at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/42d14d3350167820.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of dark gray jacket at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.982, 0.384)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec0d4d0bd36a61b1.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the matte black wheelchair at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.510, 0.647)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/90ba25b73f6f724b.jpg", "conversations": [ { "from": "human", "value": "\nLocate the white matte signboard at center in the image." }, { "from": "gpt", "value": "[(0.539, 0.714)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/579514660fc72c9d.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of white fabric jacket at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.463, 0.831)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf43d386de0c74de.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth skin at upper center further to camera compared to black matte shirt at center?" }, { "from": "gpt", "value": "No, it is in front of black matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06540b89b853eb66.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at upper left is positioned above metallic stairwell at center?" }, { "from": "gpt", "value": "Correct, green leafy tree at upper left is located above metallic stairwell at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/400ede959f0a482d.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.467, 0.972) or (0.166, 0.675)?" }, { "from": "gpt", "value": "Point (0.166, 0.675)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a6f8c873cf8a0e47.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the orange matte sign at upper center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.546, 0.239)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef563846fb6f7796.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.269, 0.527) closer to camera compared to point (0.684, 0.492)?" }, { "from": "gpt", "value": "Yes, point (0.269, 0.527) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f08f746142e058ee.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.722, 0.297)?" }, { "from": "gpt", "value": "floral bouquet at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7b14a7f5d8dcfa0.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in a South Korean street scene and see the red fabric baby carriage at lower right. If you want to take a closer look at the carriage without moving your position, how far should you extend your arm to reach it?" }, { "from": "gpt", "value": "The red fabric baby carriage at lower right is 33.02 inches away from the camera, so you would need to extend your arm approximately 33.02 inches to reach it while staying in your current position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d2843ed60eb3b352.jpg", "conversations": [ { "from": "human", "value": "\nYou are a drone operator trying to locate a person in a rural area. You see the camo uniform at right and the brown dirt field at lower left. Which object is positioned higher in the image?" }, { "from": "gpt", "value": "The camo uniform at right is located above the brown dirt field at lower left, so the camo uniform at right is higher in the image." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/17adcac1b97c5ac0.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the origin point of a coordinate system placed over the image. The origin is at the bottom left corner of the image. The x and y axes increase to the right and upwards respectively. You want to walk to the gray concrete pavement at center. Which direction should you move in terms of x and y coordinates?" }, { "from": "gpt", "value": "To reach the gray concrete pavement at center located at coordinates point (0.463, 0.722), you should move in the positive x and positive y direction since the x and y values are greater than the origin at (0.000, 0.000)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fae05c0c21bdb426.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and want to reach the point at coordinates point (0.516, 0.528). If you can walk 10 feet per minute, how long will it take you to reach there?" }, { "from": "gpt", "value": "The distance between point (0.516, 0.528) and the camera is 11.53 feet. Since you walk at 10 feet per minute, it will take approximately 1.15 minutes to reach the point." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/87aa8888001c575d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white marble statue at center is positioned above purple hoodie at lower right?" }, { "from": "gpt", "value": "Yes, white marble statue at center is above purple hoodie at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82a942a49d29e1f9.jpg", "conversations": [ { "from": "human", "value": "\nWhere is fluffy beige dog at right located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.901, 0.403)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2a26eeee7a63b61c.jpg", "conversations": [ { "from": "human", "value": "\nIs brown cardboard at center taller than metallic silver pen at lower center?" }, { "from": "gpt", "value": "Correct, brown cardboard at center is much taller as metallic silver pen at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea015a91ca13f781.jpg", "conversations": [ { "from": "human", "value": "\nIs black cotton pants at lower center wider than black leather jacket at upper center?" }, { "from": "gpt", "value": "In fact, black cotton pants at lower center might be narrower than black leather jacket at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d46a086191c2def1.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of the room and want to hand a gift to the person wearing the white striped sweater at center. How far should you walk forward to reach them?" }, { "from": "gpt", "value": "The white striped sweater at center is 7.93 feet away from the camera, so you need to walk forward approximately 7.93 feet to reach them." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c231196f364e8a67.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown fluffy alpaca at center appear under green grass at upper center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/96c15814d0e3a0e4.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.034, 0.517) positioned in front of point (0.560, 0.222)?" }, { "from": "gpt", "value": "Yes, point (0.034, 0.517) is in front of point (0.560, 0.222)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/682813dae6b6905c.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.681, 0.756) and point (0.208, 0.716), which one is positioned behind?" }, { "from": "gpt", "value": "Point (0.208, 0.716)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/752e72016c675619.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if velvet blue costume at center is shorter than green plaid shirt at center?" }, { "from": "gpt", "value": "No, velvet blue costume at center is not shorter than green plaid shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed0ec97749d124b6.jpg", "conversations": [ { "from": "human", "value": "\nYou are an event planner arranging seating for a presentation. There is a smooth black suit at center marked by point (0.707, 0.677). Where should you place the speaker so they can be seen clearly by the audience?" }, { "from": "gpt", "value": "The speaker should be positioned in front of the smooth black suit at center marked by point (0.707, 0.677) to ensure they are visible to the audience." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e3eafa84c454a03f.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark brown fabric shirt at center come behind matte orange shirt at left?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/11f85583563843b4.jpg", "conversations": [ { "from": "human", "value": "\nBetween black glossy refrigerator at left and white ceramic sink at center, which one has less height?" }, { "from": "gpt", "value": "With less height is white ceramic sink at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6afcba46526800c1.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.669, 0.483)?" }, { "from": "gpt", "value": "black plastic glasses at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/214161d43b010649.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of green leafy tree at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.877, 0.841)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3bd8e0a670eee4d2.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the dirt track at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.513, 0.902)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2804375f37e705fa.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black trophy at center to the left of purple cotton shorts at right from the viewer's perspective?" }, { "from": "gpt", "value": "Indeed, matte black trophy at center is positioned on the left side of purple cotton shorts at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77db917709c733b3.jpg", "conversations": [ { "from": "human", "value": "\nYou are a passenger in the vehicle and want to know which of the two points, point (0.641, 0.181) or point (0.298, 0.458), is closer to the camera. Based on the scene description, can you determine which point is closer?" }, { "from": "gpt", "value": "Point (0.298, 0.458) is closer to the camera than point (0.641, 0.181), as the description states that point (0.641, 0.181) is further away." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c2033a221fad0d7e.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the matte black podium at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.693, 0.231)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/347d4a41650f90de.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the bronze statue at left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.270, 0.506)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37d695e8fa3ab6cc.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person trying to park your 1.8 meters tall box in the space between the shiny black sedan at center and the matte silver sedan at center. Can the box fit vertically between them?" }, { "from": "gpt", "value": "The shiny black sedan at center is taller than the matte silver sedan at center. The height difference means the space between them might not be consistent. However, since the box is 1.8 meters tall, and the shorter matte silver sedan at center is likely under that height, the box may not fit vertically if the lower part of the space is constrained by the sedans." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e803d068cb0580fd.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to dirt path at center? Please provide its 2D coordinates.Where can I find dirt path at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.593, 0.830)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/31bc97e59b93ff64.jpg", "conversations": [ { "from": "human", "value": "\nLocate green leafy tree at center in the image." }, { "from": "gpt", "value": "[(0.522, 0.306)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e07a41880e990718.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of an old stone building and notice a green leafy bush at left and a dark gray stone chimney at upper left. Which object is nearer to you?" }, { "from": "gpt", "value": "The green leafy bush at left is closer to the viewer than the dark gray stone chimney at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/62eaa4335421d256.jpg", "conversations": [ { "from": "human", "value": "\nIs purple matte car at center shorter than white matte shirt at center?" }, { "from": "gpt", "value": "Incorrect, purple matte car at center's height does not fall short of white matte shirt at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/685b870afa41fb2e.jpg", "conversations": [ { "from": "human", "value": "\nDoes smooth black hat at upper center have a greater height compared to black glossy photo of man at center?" }, { "from": "gpt", "value": "Indeed, smooth black hat at upper center has a greater height compared to black glossy photo of man at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/59a7c5d74a7020ef.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.659, 0.953) or (0.147, 0.863)?" }, { "from": "gpt", "value": "Point (0.659, 0.953) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bcbea6cb81fe4084.jpg", "conversations": [ { "from": "human", "value": "\nYou are an ice hockey player trying to pass the puck to a teammate. You have two points marked on the ice at coordinates point (0.420, 0.525) and point (0.671, 0.808). Which point is closer to you, the player?" }, { "from": "gpt", "value": "Point (0.420, 0.525) is closer to you because it is further to the viewer than point (0.671, 0.808), meaning it is nearer to your position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2895ac659e97517c.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.545, 0.627)?" }, { "from": "gpt", "value": "white satin veil at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/215fdadcfb00bb15.jpg", "conversations": [ { "from": "human", "value": "\nDoes satin black phone at center have a smaller size compared to matte black phone at center?" }, { "from": "gpt", "value": "Yes, satin black phone at center is smaller than matte black phone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a18acd3d86ffec6.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of black leather jacket at center in the image." }, { "from": "gpt", "value": "[(0.315, 0.787)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0222d9709075b5c9.jpg", "conversations": [ { "from": "human", "value": "\nPoint to white paper at lower center.Point to the white paper at lower center in the image." }, { "from": "gpt", "value": "[(0.600, 0.891)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01bed4e4d7473a8d.jpg", "conversations": [ { "from": "human", "value": "\nYou are an event photographer in a conference room. You need to capture a photo of the gray matte suit at left and the matte black hand at center. Based on their positions, which object is positioned higher in the image?" }, { "from": "gpt", "value": "The gray matte suit at left is above the matte black hand at center, so it is positioned higher in the image." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f4e522982a8221a.jpg", "conversations": [ { "from": "human", "value": "\nWhat is at (0.090, 0.769)?" }, { "from": "gpt", "value": "smooth concrete pavement at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a3a3967bb9f7a32d.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the group photo of the dark blue shirt at center and dark blue polo shirt at center. Which one is positioned to the right side of the other?" }, { "from": "gpt", "value": "The dark blue shirt at center is positioned to the right of the dark blue polo shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/35eae15563a57cbc.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the clear blue water at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.504, 0.125)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c7887148fbd3677.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.259, 0.522) come in front of point (0.128, 0.423)?" }, { "from": "gpt", "value": "Yes, point (0.259, 0.522) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7444c97cbb3a95a7.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of matte black tank top at left. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.244, 0.566)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed6f12f8c2a10d5c.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between metallic silver eagle at center and camera." }, { "from": "gpt", "value": "337.21 feet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/440babea77305b6a.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.661, 0.316) or (0.023, 0.647)?" }, { "from": "gpt", "value": "Point (0.661, 0.316)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a46e2a45156dfaf4.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the right, green leafy tree at left or rustic stone archway at center?" }, { "from": "gpt", "value": "rustic stone archway at center is more to the right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bad6d6f691e58f01.jpg", "conversations": [ { "from": "human", "value": "\nLocate the brown suede jacket at center in the image." }, { "from": "gpt", "value": "[(0.241, 0.639)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb5a7e8c6a33f23f.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker who wants to take a photo of both the green textured pine tree at center and the green leafy tree at upper left in the same frame. Given that your camera has a maximum focal length of 50 meters, can you capture both trees in a single shot without moving your position?" }, { "from": "gpt", "value": "The green textured pine tree at center and the green leafy tree at upper left are 30.49 meters apart from each other. Since the distance between them is within the camera maximum focal length of 50 meters, you can capture both trees in a single shot without moving your position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d1399074db2fac8.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of the corridor and see a black plastic sign at center and a light blue shirt at center. Which object is closer to your right side?" }, { "from": "gpt", "value": "The light blue shirt at center is closer to your right side because the black plastic sign at center is positioned on the left side of it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e644fdb49c969bb0.jpg", "conversations": [ { "from": "human", "value": "\nBetween dark blue suit at center and pink fabric shirt at right, which one is positioned lower?" }, { "from": "gpt", "value": "pink fabric shirt at right is below." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4cc9c683df8b9e51.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to rustic wood deck at center? Please provide its 2D coordinates.Where can I find rustic wood deck at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.619, 0.897)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f41603eb77d07cf6.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of carved stone lion at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.475, 0.281)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bfa126687008877f.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a light brown textured shirt at center. Pinpoint a point to the light brown textured shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.556, 0.578)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c8a4cf075007118c.jpg", "conversations": [ { "from": "human", "value": "\nLocate the white smooth flag pole at center in the image." }, { "from": "gpt", "value": "[(0.559, 0.478)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df390b1157576bb9.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a photo of the green floral dress at center and the smooth gray rock at center. Based on their positions, which object should you adjust your camera focus to first if you want to ensure both are in the frame?" }, { "from": "gpt", "value": "The green floral dress at center is to the left of smooth gray rock at center, so you should focus on the green floral dress at center first to ensure both are in the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/038779a6a99b8fe4.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, plaid fabric shirt at center or gray fabric jacket at center?" }, { "from": "gpt", "value": "Standing shorter between the two is plaid fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b046c1aaaf596b4.jpg", "conversations": [ { "from": "human", "value": "\nLocate the gray wool suit at center in the image." }, { "from": "gpt", "value": "[(0.738, 0.495)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aa90182569a7dafb.jpg", "conversations": [ { "from": "human", "value": "\nBetween metallic stainless steel counter top at center and white glossy toilet paper at upper right, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "white glossy toilet paper at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3abb3abad97caef8.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between black murky water at upper center and camera?" }, { "from": "gpt", "value": "black murky water at upper center is 24.13 feet away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c0d681c4c7532005.jpg", "conversations": [ { "from": "human", "value": "\nIs black fleece jacket at center shorter than orange fleece jacket at right?" }, { "from": "gpt", "value": "Yes, black fleece jacket at center is shorter than orange fleece jacket at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/974bfde6b2facd8b.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.323, 0.344) and point (0.292, 0.644), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.323, 0.344) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f2eae05bc2fe271.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.808, 0.483) and camera." }, { "from": "gpt", "value": "Point (0.808, 0.483) is 5.92 feet away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef66aac8dd541c07.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.307, 0.578) come behind point (0.832, 0.969)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/13363a4a484c76ba.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of blue cotton shirt at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.804, 0.594)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f2fa7a71e69f4076.jpg", "conversations": [ { "from": "human", "value": "\nYou are a parent trying to decide which play equipment is safer for your child to climb. The smooth plastic slide at left and the matte pink railing at center are both options. Based on their height, which one would be more appropriate for a child who is 1.2 meters tall?" }, { "from": "gpt", "value": "The matte pink railing at center is shorter than the smooth plastic slide at left. Since the child is 1.2 meters tall, the railing might be a safer option as it is lower to the ground and easier for the child to manage." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0408d9d35cd2437d.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of white painted wood gazebo at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.754, 0.589)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4edf767732d58eeb.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of golden feathered rooster at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.515, 0.562)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d612e9a48afdb84.jpg", "conversations": [ { "from": "human", "value": "\nIs knitted fabric at center below soft fur cat at left?" }, { "from": "gpt", "value": "Yes, knitted fabric at center is below soft fur cat at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/11c049d03c9b357d.jpg", "conversations": [ { "from": "human", "value": "\nPlease describe the position of the white soft flatbread at center relative to the other items on the banana leaf." }, { "from": "gpt", "value": "The white soft flatbread at center is located at the central part of the banana leaf, positioned at coordinates approximately 0.725 along the x axis and 0.506 along the y axis." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/053ea75af199a99a.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, white glossy van at center or green fabric shirt at left?" }, { "from": "gpt", "value": "Standing shorter between the two is green fabric shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0ea16a8715d9d29.jpg", "conversations": [ { "from": "human", "value": "\nYou are an artist painting this landscape. You want to ensure the foggy blue mountain at center and the dull green trees at center are positioned correctly. According to the scene description, which object should be placed higher in your painting?" }, { "from": "gpt", "value": "The foggy blue mountain at center should be placed higher in the painting since it is located above the dull green trees at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/83edf889737d5596.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker who wants to cross the gray stone river at center. You notice a green leafy tree at upper center nearby. Which one is wider in terms of their spread? Please answer based on their widths." }, { "from": "gpt", "value": "The green leafy tree at upper center is wider than the gray stone river at center because its width surpasses the river." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c927e7df1ce21a0.jpg", "conversations": [ { "from": "human", "value": "\nCould you measure the distance between brass clock face at upper left and metallic silver street sign at center?" }, { "from": "gpt", "value": "33.55 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b877509ebfd4a97c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue mosaic tiles at center is positioned to the left of blue mosaic tile swimming pool at center?" }, { "from": "gpt", "value": "No, blue mosaic tiles at center is not to the left of blue mosaic tile swimming pool at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4dc0ece5efc10fb9.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, translucent plastic heart at center or translucent rubber toy at center, stands shorter?" }, { "from": "gpt", "value": "Standing shorter between the two is translucent plastic heart at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/63aafcb90335e91c.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture both the bronze statue at left and the black feathered pigeon at lower left in a single frame. Given their sizes, which object should you focus on first to ensure both are in focus?" }, { "from": "gpt", "value": "The bronze statue at left is larger than the black feathered pigeon at lower left, so you should focus on the bronze statue at left first to ensure both are in focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/15d89a3756a1ab46.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, smooth stone alley at center or white paper sign at center, stands taller?" }, { "from": "gpt", "value": "With more height is white paper sign at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b1ad677266b6741.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of green matte tree at upper left. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.226, 0.269)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4064c1602435de9b.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the gray wool scarf at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.769, 0.283)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/45362ba868479680.jpg", "conversations": [ { "from": "human", "value": "\nPoint to green fabric curtain at left.Point to the green fabric curtain at left in the image." }, { "from": "gpt", "value": "[(0.058, 0.237)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/654499ca538d667a.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.855, 0.502) and point (0.730, 0.816), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.730, 0.816) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3211d9f98b8ae67c.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.647, 0.258) or point (0.422, 0.589)?" }, { "from": "gpt", "value": "The point (0.647, 0.258) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/47b09b34e24b4039.jpg", "conversations": [ { "from": "human", "value": "\nLocate all yellow matte bus at center in the image." }, { "from": "gpt", "value": "[(0.501, 0.520)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc020a53b8b8e6db.jpg", "conversations": [ { "from": "human", "value": "\nBetween green leafy tree at upper center and stone/brick palace at center, which one has more height?" }, { "from": "gpt", "value": "Standing taller between the two is green leafy tree at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c8970a4c68fc0ac8.jpg", "conversations": [ { "from": "human", "value": "\nPoint to velvet black jacket at center.Point to the velvet black jacket at center in the image." }, { "from": "gpt", "value": "[(0.741, 0.838)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d10577fd74c3baa.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of white cotton shirt at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.710, 0.623)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be2cdbafae3dbe51.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of dark brown leather jacket at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.583, 0.398)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4390bb9b192b6c10.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.258, 0.761) or (0.658, 0.427)?" }, { "from": "gpt", "value": "The point (0.658, 0.427) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01013a96ab205fe4.jpg", "conversations": [ { "from": "human", "value": "\nPoint to silver metallic tower at center-right.Point to the silver metallic tower at center-right in the image." }, { "from": "gpt", "value": "[(0.707, 0.584)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fef84653a48d409f.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of rocky brown mountain at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.537, 0.359)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca5ad95fc29cbb08.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of white matte pickup truck at center?" }, { "from": "gpt", "value": "white matte pickup truck at center and camera are 2.87 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fd1e2908e3e46395.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, pink fabric shirt at center or purple fabric blouse at center?" }, { "from": "gpt", "value": "purple fabric blouse at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46f9eae49cc37ef8.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.172, 0.405)?" }, { "from": "gpt", "value": "purple fleece jacket at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4ad10ed85c5f75de.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of natural wood hut at center less distant than that of wooden at center?" }, { "from": "gpt", "value": "Yes, natural wood hut at center is in front of wooden at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ea8b81088da5b62.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if wooden picture frame at center is taller than black ink signature at center?" }, { "from": "gpt", "value": "Indeed, wooden picture frame at center has a greater height compared to black ink signature at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f8622e1bba34081a.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.309, 0.706) or point (0.653, 0.436)?" }, { "from": "gpt", "value": "The point (0.653, 0.436) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/283d042a35f2d367.jpg", "conversations": [ { "from": "human", "value": "\nLocate the smooth wooden balcony at center in the image." }, { "from": "gpt", "value": "[(0.287, 0.573)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df2713deb03f1ac3.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture both girls in a single frame. Since the multicolored fabric swimsuit at center and pink fabric swimsuit at center are both at the center, which swimsuit will require more space in the frame to accommodate its width?" }, { "from": "gpt", "value": "The multicolored fabric swimsuit at center requires more space in the frame because its width surpasses that of the pink fabric swimsuit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/74ede96691eb5a3b.jpg", "conversations": [ { "from": "human", "value": "\nDoes marble at center appear over brown woolen jacket at lower left?" }, { "from": "gpt", "value": "No, marble at center is not above brown woolen jacket at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/10aca14f8c5cdaa8.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of smooth sand bear at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.560, 0.573)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/47a6ceb589db797e.jpg", "conversations": [ { "from": "human", "value": "\nWhat is at (0.806, 0.711)?" }, { "from": "gpt", "value": "black matte jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e402acd9aa1a6899.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a jeans at lower left. Pinpoint a point to the jeans at lower left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.176, 0.616)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd806ea583217f61.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.517, 0.486)?" }, { "from": "gpt", "value": "matte gray shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88bd6b7f65c5a0a0.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.631, 0.525) or point (0.782, 0.686)?" }, { "from": "gpt", "value": "Positioned in front is point (0.782, 0.686)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8dafa2e2b21bd209.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte tattoo at upper center is positioned to the left of brown textured tattoo at upper right?" }, { "from": "gpt", "value": "Indeed, matte tattoo at upper center is positioned on the left side of brown textured tattoo at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9795723f8f75b164.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.465, 0.591) and camera?" }, { "from": "gpt", "value": "A distance of 95.03 meters exists between point (0.465, 0.591) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4bdd3b2bba270996.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the white picket fence at lower center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.115, 0.741)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/686691b805217150.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of white fluffy cloud at upper center from camera?" }, { "from": "gpt", "value": "The distance of white fluffy cloud at upper center from camera is 2.56 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f380b7c821b41787.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person trying to park your shiny blue car at center in a parking spot that can only accommodate vehicles smaller than the metallic blue car at center. Can your car fit in the spot?" }, { "from": "gpt", "value": "The shiny blue car at center occupies less space than the metallic blue car at center, so yes, the delivery person can park their shiny blue car at center in the spot since it is smaller than the metallic blue car at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3796dc37ec91cdd8.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any red brick building at upper center in the image." }, { "from": "gpt", "value": "[(0.849, 0.325)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e2f3c7151c11d2aa.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.546, 0.558) positioned before point (0.517, 0.709)?" }, { "from": "gpt", "value": "No, it is behind (0.517, 0.709)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e84c3426bd240c0.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the natural wood railing at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.787, 0.892)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/53c9613d491529ec.jpg", "conversations": [ { "from": "human", "value": "\nYou are a guest sitting on the sofa facing the gold metallic round table at center. You want to reach the black glossy drawer at right to grab a remote control. Can you directly access it without moving around the table?" }, { "from": "gpt", "value": "The black glossy drawer at right is in front of the gold metallic round table at center, so yes, you can directly access the black glossy drawer at right without needing to move around the table since it is positioned in front of it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e9d45a4d255b14a.jpg", "conversations": [ { "from": "human", "value": "\nBetween blue shirt at center and white cloth at center, which one has less height?" }, { "from": "gpt", "value": "Standing shorter between the two is white cloth at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6fcbd1306f10466.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, blue plastic chair at lower right or striped fabric tie at left?" }, { "from": "gpt", "value": "blue plastic chair at lower right is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/874a59997029748f.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the pink satin shirt at left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.460, 0.544)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/662dd1d610e2ce2a.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.687, 0.591) farther from camera compared to point (0.278, 0.847)?" }, { "from": "gpt", "value": "Yes, it is behind point (0.278, 0.847)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d90851f53c5b5cf.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between light green shirt at center and green textured shirt at center?" }, { "from": "gpt", "value": "A distance of 3.55 inches exists between light green shirt at center and green textured shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/63af96a8303b9e34.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.932, 0.886) more distant than point (0.400, 0.647)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf7a60e5a7fba7b8.jpg", "conversations": [ { "from": "human", "value": "\nDoes striped cotton shirt at center appear over brown matte food at center?" }, { "from": "gpt", "value": "Indeed, striped cotton shirt at center is positioned over brown matte food at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/acb31a18988aed5c.jpg", "conversations": [ { "from": "human", "value": "\nBetween purple striped shirt at center and black matte shirt at upper right, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "From the viewer's perspective, purple striped shirt at center appears more on the left side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/99bf4df6ab424e4e.jpg", "conversations": [ { "from": "human", "value": "\nBetween white wooden railing at upper center and pink fleece jacket at center, which one is positioned higher?" }, { "from": "gpt", "value": "white wooden railing at upper center is above." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/281ef7ff53471e63.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.445, 0.425) or (0.251, 0.255)?" }, { "from": "gpt", "value": "The point (0.251, 0.255) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c23e94fe08f2e3ae.jpg", "conversations": [ { "from": "human", "value": "\nWhere is metallic silver eiffel tower at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.482, 0.497)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c48d0f72d069f9bb.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a photo of the olive green parka at center and the white matte duck at center. Which object should you zoom in on to ensure both are clearly visible in the frame?" }, { "from": "gpt", "value": "The olive green parka at center has a larger size compared to the white matte duck at center. To ensure both are clearly visible, you should zoom out slightly so that the larger olive green parka at center doesn t fill the frame too much, allowing space for the smaller white matte duck at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/59ea9b07594d9512.jpg", "conversations": [ { "from": "human", "value": "\nIs blue fabric shirt at lower center closer to the viewer compared to dark gray suit at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4bfb04c069cb906.jpg", "conversations": [ { "from": "human", "value": "\nIs polished wood door at center bigger than white paper sign at lower left?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a71cdefd008bf811.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a yellow fabric tent at center. Pinpoint a point to the yellow fabric tent at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.566, 0.634)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0df64d7ad38d71c1.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.702, 0.380) come behind point (0.339, 0.433)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5436e2cca3982aae.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the decorative fence with orange and white pillars. There is a point marked at coordinates (0.192, 0.894). Based on the scene description, where is this point located?" }, { "from": "gpt", "value": "The point is on the white concrete path at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08a68c8b2f7a7b68.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.489, 0.608) farther from viewer compared to point (0.461, 0.573)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1a5b24d790c04ee.jpg", "conversations": [ { "from": "human", "value": "\nHow much distance is there between brown polished pole at center and black leather uniform at center?" }, { "from": "gpt", "value": "brown polished pole at center is 16.33 feet away from black leather uniform at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d77c57f3212e45b1.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person who needs to place a small package on the brick pavement at center. However, there is a blue printed fabric dress at center in the way. Can you place the package there without moving the dress?" }, { "from": "gpt", "value": "The brick pavement at center is wider than the blue printed fabric dress at center, so there is enough space to place the package without moving the dress." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b363f09c1bdab0e9.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the dock next to the SUSITNA ferry. You want to throw a small floating toy into the water. The toy needs to travel at least 150 feet to reach the middle of the glossy dark blue water at center. Do you think the toy will reach the middle of the water?" }, { "from": "gpt", "value": "The distance between the glossy dark blue water at center and the camera is 152.08 feet. Since the toy needs to travel at least 150 feet, it will just barely reach the middle of the glossy dark blue water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bcb0dda636fa887f.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery driver who needs to park your vehicle precisely at the rear of the silver Nissan Qashqai shown. The parking spot has a strict boundary marked by the metallic gray curb at lower center. Using the coordinate system where the bottom left corner of the image is the origin point, can you determine if the current position of the silver Nissan Qashqai is within the allowed parking boundaries defined by the curb?" }, { "from": "gpt", "value": "The metallic gray curb at lower center is located at coordinate point (0.867, 0.838). Since the Nissan Qashqai is parked in front of the beige tiled wall and the curb marks the boundary, the car is positioned within the allowed parking area as it is parked in front of the curb." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bbfafb58b637fb70.jpg", "conversations": [ { "from": "human", "value": "\nLocate all black wool coat at center in the image." }, { "from": "gpt", "value": "[(0.509, 0.672)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/312fefff1ddcc74d.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the camouflage fabric rifle at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.606, 0.633)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b9e55c066432d5a.jpg", "conversations": [ { "from": "human", "value": "\nDoes black satin dress at center have a smaller size compared to silver metallic laptop at upper left?" }, { "from": "gpt", "value": "No, black satin dress at center is not smaller than silver metallic laptop at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0613bf23dfc76ae7.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.474, 0.781)?" }, { "from": "gpt", "value": "matte red tractor at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d034c418044ac46d.jpg", "conversations": [ { "from": "human", "value": "\nDoes smooth bark tree at center appear on the right side of smooth gray tree trunk at center?" }, { "from": "gpt", "value": "Correct, you'll find smooth bark tree at center to the right of smooth gray tree trunk at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/80902bdc7cec793e.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of matte black sunglasses at upper left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.287, 0.622)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/59aab415572296d8.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between neon/glass tube at upper center and camera?" }, { "from": "gpt", "value": "neon/glass tube at upper center and camera are 4.14 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0207fd3d33dfe223.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of painted wood bird feeder at center in the image." }, { "from": "gpt", "value": "[(0.475, 0.567)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/75064d5f452fef39.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.035, 0.834) or (0.912, 0.428)?" }, { "from": "gpt", "value": "Positioned behind is point (0.912, 0.428)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e73e05e2725de000.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing behind the two children. You want to take a photo that includes both the matte red shirt at left and the yellow chalk at center. Which object should you focus on first to ensure both are in clear view?" }, { "from": "gpt", "value": "The matte red shirt at left is closer to the viewer than the yellow chalk at center, so you should focus on the matte red shirt at left first to ensure both are in clear view." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d10e89bfda845a5d.jpg", "conversations": [ { "from": "human", "value": "\nYou are a student in the classroom. You need to pass a note to the student wearing the plaid shirt at right. If you are currently at the white shirt at center, how far do you have to walk to reach them?" }, { "from": "gpt", "value": "The white shirt at center is 7.96 feet from the plaid shirt at right, so you would need to walk approximately 8 feet to reach them." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d77eff3d5d76dfae.jpg", "conversations": [ { "from": "human", "value": "\nDoes white plastic sign at center have a lesser width compared to shiny black sedan at center?" }, { "from": "gpt", "value": "Yes, white plastic sign at center is thinner than shiny black sedan at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c2907321f870633b.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.843, 0.237) positioned behind point (0.853, 0.422)?" }, { "from": "gpt", "value": "Yes, point (0.843, 0.237) is farther from viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/33793eab2f41dbce.jpg", "conversations": [ { "from": "human", "value": "\nDoes pink satin blouse at center lie behind gray concrete pavement at lower left?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0ecfb4f9725ae62.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer positioned at the back of the church aisle. You need to capture a clear photo of both the white tulle dress at center and the white satin dress at center. Which dress will appear shorter in the photo?" }, { "from": "gpt", "value": "The white tulle dress at center will appear shorter in the photo because it is not as tall as the white satin dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ad11c6a7d1b8194.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.513, 0.956) or (0.283, 0.762)?" }, { "from": "gpt", "value": "Positioned behind is point (0.283, 0.762)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c562ffbecfa89288.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to blue water at center? Please provide its 2D coordinates.Where can I find blue water at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.242, 0.702)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb769bf56a357777.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.510, 0.897) or point (0.999, 0.961)?" }, { "from": "gpt", "value": "Point (0.510, 0.897)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/af0e838bb18737cd.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of dark blue shirt at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.770, 0.648)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cab6080726edec3b.jpg", "conversations": [ { "from": "human", "value": "\nIn the LEGO diorama of the cozy diner scene, there is a shiny brown bowl at center and a smooth brown minifigure at center. Which object is taller?" }, { "from": "gpt", "value": "The shiny brown bowl at center is taller than the smooth brown minifigure at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6156b4ca619ee936.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the smooth sand beach at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.736, 0.884)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d5c7341690ad2e1d.jpg", "conversations": [ { "from": "human", "value": "\nPoint to brown gravel dirt at center.Point to the brown gravel dirt at center in the image." }, { "from": "gpt", "value": "[(0.531, 0.794)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe95e4ff55e4a0f3.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark blue jacket at center have a lesser height compared to dark gray wool coat at center?" }, { "from": "gpt", "value": "Incorrect, dark blue jacket at center's height does not fall short of dark gray wool coat at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/20d0f73aedc677cd.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the protest and want to capture both the purple cotton shirt at upper right and the red fabric flag at lower center in the same frame. Which object should you focus on first to ensure both are in the frame?" }, { "from": "gpt", "value": "The purple cotton shirt at upper right is above the red fabric flag at lower center, so you should focus on the purple cotton shirt at upper right first to ensure both are in the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e246d0c037691b34.jpg", "conversations": [ { "from": "human", "value": "\nIs matte orange dress at center taller than matte black tie at center?" }, { "from": "gpt", "value": "Correct, matte orange dress at center is much taller as matte black tie at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b37af9f17d45dffa.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of brown matte bird at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.319, 0.530)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7f0ce43b40b08940.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between wooden church at center and camera?" }, { "from": "gpt", "value": "A distance of 76.38 meters exists between wooden church at center and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6be88c9989ccf944.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.666, 0.358)?" }, { "from": "gpt", "value": "black fabric banner at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/031902d7048d5eb6.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of camouflage fabric us army uniform at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.465, 0.473)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4b4b6827648dfb8.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the waterfront and want to take a photo of the blue glassy water at center. How far do you need to walk forward to get closer to it?" }, { "from": "gpt", "value": "The blue glassy water at center is 175.98 feet away from the camera. To get closer, you would need to walk forward approximately 175.98 feet to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/174630750110e795.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.677, 0.811) and point (0.891, 0.475), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.891, 0.475) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6b402593534fefe.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the clear glass window at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.777, 0.377)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d5b66936a1ddd242.jpg", "conversations": [ { "from": "human", "value": "\nPoint to metallic gray fence at center.Point to the metallic gray fence at center in the image." }, { "from": "gpt", "value": "[(0.499, 0.333)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e8f25dd3141afbb.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing 5 feet away from the table in the meeting room. There is a point at coordinates (0.804, 0.234) in the image. Can you reach that point without moving closer to the table?" }, { "from": "gpt", "value": "The distance of point (0.804, 0.234) from viewer is 6.68 feet. Since you are currently 5 feet away from the table, the point is 1.68 feet further away from you, so you cannot reach it without moving closer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf21d9db3c7c8f22.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, stainless steel pot at right or white glossy pillar at center, stands taller?" }, { "from": "gpt", "value": "With more height is white glossy pillar at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e3cb6f99f78beabf.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.669, 0.684) or (0.559, 0.375)?" }, { "from": "gpt", "value": "Point (0.559, 0.375) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b572858f084eaf84.jpg", "conversations": [ { "from": "human", "value": "\nWhat is at (0.517, 0.611)?" }, { "from": "gpt", "value": "blue matte toy car at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc82b837b9bbef91.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.803, 0.527)?" }, { "from": "gpt", "value": "brown textured dinosaur at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/11cd829c1e54af60.jpg", "conversations": [ { "from": "human", "value": "\nLocate all gray rough boulder at lower center in the image." }, { "from": "gpt", "value": "[(0.430, 0.931)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c56630cb12fc081.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.760, 0.342) closer to viewer compared to point (0.355, 0.680)?" }, { "from": "gpt", "value": "Yes, point (0.760, 0.342) is in front of point (0.355, 0.680)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36def1eebd8a4b24.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of golden glass chandelier at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.938, 0.073)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d912d55f21ce87f8.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the matte black goggles at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.569, 0.814)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/57e6a54bdeaaf627.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the dark brown jacket at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.346, 0.630)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/585478b1b1cd049b.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person trying to park your black matte bicycle at lower right near the white wooden window at center. Considering the space between them, can the bicycle fit without blocking the window?" }, { "from": "gpt", "value": "The black matte bicycle at lower right might be wider than white wooden window at center, so there is a possibility that parking the bicycle could block the window. Check the exact dimensions before deciding." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/32c31aa1a040aa8d.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between green reflective water at center and camera." }, { "from": "gpt", "value": "The distance of green reflective water at center from camera is 6.64 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8561fe7aa35379f7.jpg", "conversations": [ { "from": "human", "value": "\nDoes orange perforated metal building at center have a larger size compared to brown water at lower center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ddd8fb90d65ffb58.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the winter sports event and want to know how far the point marked at coordinates (0.788, 0.716) is from your current position. Can you determine the distance?" }, { "from": "gpt", "value": "The point marked at coordinates (0.788, 0.716) is 150.19 meters away from your current position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00728223e1e87e11.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the left, denim at center or matte black phone at center?" }, { "from": "gpt", "value": "matte black phone at center is more to the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1dfef32606c27204.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of green leafy tree at left in the image." }, { "from": "gpt", "value": "[(0.124, 0.530)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/38430c5c44f34018.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.171, 0.625) positioned after point (0.604, 0.592)?" }, { "from": "gpt", "value": "No, (0.171, 0.625) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95aa2c58e3e00d4c.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the blonde synthetic hair at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.731, 0.237)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/90290c44e39abe96.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, silver metallic car at center or satin silver car at center?" }, { "from": "gpt", "value": "satin silver car at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be5a267825fdfa83.jpg", "conversations": [ { "from": "human", "value": "\nYou are a medical student observing a surgery. You notice the matte blue gown at center and the satin silver scalpel at center. Which object takes up more horizontal space in the image?" }, { "from": "gpt", "value": "The matte blue gown at center has a larger width than the satin silver scalpel at center, so it takes up more horizontal space." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d181b4f088969bc.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the valley and see the green textured mountain at center and the green textured tree at lower center. Which one is positioned to the left from your viewpoint?" }, { "from": "gpt", "value": "The green textured mountain at center is positioned to the left of the green textured tree at lower center from your viewpoint." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/647bdcd06a833450.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black dress at left closer to the viewer compared to matte black dress at center?" }, { "from": "gpt", "value": "Yes, matte black dress at left is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/235bccb1ca505475.jpg", "conversations": [ { "from": "human", "value": "\nLocate smooth brown log at center in the image." }, { "from": "gpt", "value": "[(0.424, 0.577)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/028c7d9a98bbebb2.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up for a group photo. You need to position two markers at coordinates point (0.698, 0.628) and point (0.110, 0.963). Which marker is closer to the camera?" }, { "from": "gpt", "value": "Point (0.698, 0.628) is closer to the camera than point (0.110, 0.963)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/470620573f132445.jpg", "conversations": [ { "from": "human", "value": "\nDescribe the object at (0.297, 0.661)." }, { "from": "gpt", "value": "green grassy field at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5f780e6d27aecb4.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.529, 0.369) come closer to viewer compared to point (0.984, 0.050)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f8ecad4942f47bc.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.407, 0.658) closer to camera compared to point (0.355, 0.831)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd8cf375a8889025.jpg", "conversations": [ { "from": "human", "value": "\nYou are a sound technician setting up for a presentation. You need to ensure the microphone closest to the speaker is the one with the best audio quality. Which microphone should you choose between the black glossy microphone at center and the black metallic microphone at center?" }, { "from": "gpt", "value": "The black glossy microphone at center is in front of the black metallic microphone at center, so the black glossy microphone at center is closer to the speaker and should be chosen for better audio quality." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e6a66145c1b11f46.jpg", "conversations": [ { "from": "human", "value": "\nYou are a farmer who wants to install a sprinkler system to water both the green grassy at center and the green grassy hillside at left. The sprinkler can cover up to 200 feet. Is the distance between them within the sprinkler system coverage?" }, { "from": "gpt", "value": "The distance between the green grassy at center and the green grassy hillside at left is 180.29 feet, which is within the sprinkler system coverage of 200 feet. Therefore, the sprinkler can effectively water both areas." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92b58d4196989490.jpg", "conversations": [ { "from": "human", "value": "\nLocate all black matte diving suit at center in the image." }, { "from": "gpt", "value": "[(0.337, 0.598)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef33c0f17f135e73.jpg", "conversations": [ { "from": "human", "value": "\nLocate the matte pink scarf at center in the image." }, { "from": "gpt", "value": "[(0.665, 0.512)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08dd92eb250d84a0.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the white stone rock at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.517, 0.561)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6da70acb02dec97.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing a seating arrangement for an event under the canopy. You have two chairs available. The first chair is designed to fit the blue leather suit at upper right, and the second chair is for the blue uniform at center. Which chair requires more width to accommodate the wearer?" }, { "from": "gpt", "value": "The chair for the blue leather suit at upper right requires more width because the blue leather suit at upper right is wider than the blue uniform at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d481db0509d0137.jpg", "conversations": [ { "from": "human", "value": "\nYou are a stagehand needing to move a 30 feet long extension cord from the black fabric camera at center to the light blue denim jacket at lower right. Can you safely lay the cord along the path between them without it being too short?" }, { "from": "gpt", "value": "The distance between the black fabric camera at center and the light blue denim jacket at lower right is 25.52 feet. Since the extension cord is 30 feet long, it is longer than the required distance, so you can safely lay the cord without it being too short." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/989dbeb821a9cb9a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white powdery snow at center is positioned below bare wood tree at center?" }, { "from": "gpt", "value": "Correct, white powdery snow at center is located below bare wood tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/017427eff16cc96a.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of white matte bicycle at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.279, 0.750)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/abfd6befde2ad92a.jpg", "conversations": [ { "from": "human", "value": "\nBetween polka dot blouse at left and wooden box at center, which one has less height?" }, { "from": "gpt", "value": "wooden box at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8531528ec4328e65.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.621, 0.534) positioned behind point (0.385, 0.878)?" }, { "from": "gpt", "value": "No, (0.621, 0.534) is in front of (0.385, 0.878)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7c6f07be75ae7915.jpg", "conversations": [ { "from": "human", "value": "\nWhat is at (0.310, 0.347)?" }, { "from": "gpt", "value": "orange matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c2caca4ad2147b9e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.594, 0.480)?" }, { "from": "gpt", "value": "orange fabric bulletin board at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/80a992a3671af23f.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between point (0.132, 0.452) and camera?" }, { "from": "gpt", "value": "The distance of point (0.132, 0.452) from camera is 2.31 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/81aaad5d92a8858d.jpg", "conversations": [ { "from": "human", "value": "\nYou have a small container that can only hold items up to the size of the brown rough stone at lower center. Can you fit the white plastic bag at lower left into the container without it overflowing?" }, { "from": "gpt", "value": "The white plastic bag at lower left is larger in width than the brown rough stone at lower center, so it won" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dbf2d6fe0d5d0237.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.387, 0.730)?" }, { "from": "gpt", "value": "light blue uniform at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d04b9033f6e3bae.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.547, 0.309)?" }, { "from": "gpt", "value": "green mossy rock at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5bee2e5d9bee10f.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark gray concrete stairs at center have a smaller size compared to white matte chair at lower left?" }, { "from": "gpt", "value": "Incorrect, dark gray concrete stairs at center is not smaller in size than white matte chair at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e464036e9c7799d.jpg", "conversations": [ { "from": "human", "value": "\nIs black wire at upper center in front of brown brick buildings at center?" }, { "from": "gpt", "value": "No, black wire at upper center is further to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/977e6eb0c8448a80.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.298, 0.322) and point (0.635, 0.308), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.298, 0.322) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2968e25217418c38.jpg", "conversations": [ { "from": "human", "value": "\nIs green fabric scarf at left above green matte mangoes at center?" }, { "from": "gpt", "value": "Yes, green fabric scarf at left is above green matte mangoes at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0898db255df1d21a.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.015, 0.553) or point (0.417, 0.386)?" }, { "from": "gpt", "value": "Point (0.417, 0.386) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/098e420d95ec09ed.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.304, 0.833) behind point (0.954, 0.445)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e7b09675caf40074.jpg", "conversations": [ { "from": "human", "value": "\nHow close is point (0.164, 0.384) from camera?" }, { "from": "gpt", "value": "Point (0.164, 0.384) and camera are 1.11 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fd7a297bddb4d132.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.588, 0.998) or point (0.312, 0.466)?" }, { "from": "gpt", "value": "Point (0.312, 0.466) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9262cbd2f6ba9a7c.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between point (0.743, 0.081) and camera." }, { "from": "gpt", "value": "They are 9.96 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60e5bb84ef83580b.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of silver metallic sedan at right?" }, { "from": "gpt", "value": "silver metallic sedan at right is 13.65 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b8e8f69140a8abd.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.127, 0.131) from camera?" }, { "from": "gpt", "value": "A distance of 21.84 meters exists between point (0.127, 0.131) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7f3039ef6a1d845a.jpg", "conversations": [ { "from": "human", "value": "\nIs painted vinyl van at center to the right of black felt cowboy hat at center from the viewer's perspective?" }, { "from": "gpt", "value": "Incorrect, painted vinyl van at center is not on the right side of black felt cowboy hat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/61c1364922bb43b6.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.715, 0.228) come behind point (0.644, 0.722)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2822c3eb5f1738cd.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.931, 0.120) positioned behind point (0.096, 0.741)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/026bf1fc1aace3dc.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of point (0.184, 0.925)?" }, { "from": "gpt", "value": "Point (0.184, 0.925) and camera are 366.66 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b03de0161c384c8.jpg", "conversations": [ { "from": "human", "value": "\nYou are a zookeeper observing the gorilla enclosure. You notice a point marked at coordinates (0.514, 0.648). What object does this point correspond to?" }, { "from": "gpt", "value": "The point at coordinates (0.514, 0.648) corresponds to the shiny black monkey at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8eb7d0cb4c6e5c22.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the dining table and want to reach both points on the table. Which point, point (0.192, 0.883) or point (0.526, 0.423), is closer to you?" }, { "from": "gpt", "value": "Point (0.192, 0.883) is closer to the viewer than point (0.526, 0.423)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe53f99dbda7bc78.jpg", "conversations": [ { "from": "human", "value": "\nIs matte yellow t-shirt at left positioned before yellow matte shirt at center?" }, { "from": "gpt", "value": "Yes, it is in front of yellow matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5f6477fc68416b7c.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green matte leaf at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.260, 0.600)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a9a05a06ce45704.jpg", "conversations": [ { "from": "human", "value": "\nIs brown brick houses at lower center closer to the viewer compared to brown stone tower at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/790d97cfc6553b13.jpg", "conversations": [ { "from": "human", "value": "\nYou are an event planner arranging a photoshoot. You need to ensure that the gold shiny robe at center and the matte floral dress at left are visible in the frame. Based on their positions, which one is closer to the camera?" }, { "from": "gpt", "value": "The gold shiny robe at center is positioned under the matte floral dress at left, meaning it is closer to the camera since it is placed lower in the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/774a72e3ac1268dd.jpg", "conversations": [ { "from": "human", "value": "\nYou are a customer sitting at the round table with black metal chairs in the foreground of the cozy interior space. You want to hang a matte black picture frame on the wall above the table. The coordinates given are in the image coordinate system where the origin is at the bottom left corner. Can you confirm if the point marked at (0.621, 0.270) is suitable for hanging the frame above the table?" }, { "from": "gpt", "value": "The point marked at (0.621, 0.270) corresponds to the matte black picture frame at upper center, which is already placed there. Since the frame is already at that location, it is suitable for hanging the matte black picture frame above the table." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e58fbd8569d549a9.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the street and see the bus with the AD5008 plate and the restaurant sign. You want to walk to the point marked at coordinates (0.753, 0.383). Is this point closer to you than 7 meters?" }, { "from": "gpt", "value": "The distance of point (0.753, 0.383) from viewer is 6.74 meters, so yes, the point is closer than 7 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3e2cd1aa8051ea86.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of dark brown fabric headboard at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.560, 0.308)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2834b086a605ed37.jpg", "conversations": [ { "from": "human", "value": "\nWhat are the coordinates of the camouflage fabric uniform at center?" }, { "from": "gpt", "value": "The camouflage fabric uniform at center is located at coordinates point (0.541, 0.680)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/735206c07fa1f55f.jpg", "conversations": [ { "from": "human", "value": "\nPoint to light brown hair at center.Point to the light brown hair at center in the image." }, { "from": "gpt", "value": "[(0.869, 0.977)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0068b5f37812eb5a.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.450, 0.906) and point (0.530, 0.558), which one is positioned behind?" }, { "from": "gpt", "value": "Point (0.450, 0.906)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9caeae6e4422841b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown leather coat at center is shorter than white satin dress at lower right?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8cf044902b22f0f4.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.404, 0.945) closer to camera compared to point (0.302, 0.645)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/270948abe5dcb86a.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, green grass at lower right or gray concrete at lower left, stands taller?" }, { "from": "gpt", "value": "With more height is gray concrete at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5909ae52379cba17.jpg", "conversations": [ { "from": "human", "value": "\nWhat is at (0.917, 0.453)?" }, { "from": "gpt", "value": "shiny black hair at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e962ba04a68f4c8.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of pink stone building at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.604, 0.534)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b29887c19ef25f8.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of light skin hands at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.137, 0.691)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f43ba07d6886c44.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the smooth concrete waterway at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.514, 0.698)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/657ffb9dcbfb015a.jpg", "conversations": [ { "from": "human", "value": "\nIs leather couch at center above black carved wood sign at center?" }, { "from": "gpt", "value": "Incorrect, leather couch at center is not positioned above black carved wood sign at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e2d96bbb5f3504d1.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to wooden/rustic fence at center? Please provide its 2D coordinates.Where can I find wooden/rustic fence at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.500, 0.809)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d74e633509fcff1e.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.750, 0.561) and point (0.238, 0.853), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.750, 0.561) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/52d0ff562145945a.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the wooden at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.545, 0.833)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02decf94eb71a979.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the landscape and want to take a photo of both the snowy rocky mountain range at upper left and the green leafy tree at center. Which object should you focus on first to ensure both are in the frame?" }, { "from": "gpt", "value": "You should focus on the green leafy tree at center first because it is closer to you than the snowy rocky mountain range at upper left, so adjusting the camera to include the closer tree will also capture the distant mountains in the background." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/909ab53305d417fd.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing a photoshoot and need to arrange two green dresses from left to right. The velvet green dress at center and the satin dark green dress at center are available. According to the image, which dress should be placed on the left side?" }, { "from": "gpt", "value": "The velvet green dress at center should be placed on the left side because it is positioned on the left side of the satin dark green dress at center in the image." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b618747c9964cf8.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, gray fleece jacket at center or blue fabric shirt at center?" }, { "from": "gpt", "value": "blue fabric shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f2ad814f9bcf83b5.jpg", "conversations": [ { "from": "human", "value": "\nBetween matte red beret at center and dark blue jersey at center, which one is positioned lower?" }, { "from": "gpt", "value": "dark blue jersey at center is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4346c450eb92745b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if pink cotton shirt at center is thinner than white cotton dress at center?" }, { "from": "gpt", "value": "Incorrect, pink cotton shirt at center's width is not less than white cotton dress at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/61f49ddc22e8a7cb.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the dark gray suit at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.546, 0.611)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/958f09d5862fded0.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the red fabric flags at center in the nighttime scene. The camera you are using has a limited field of view and can only focus on objects within a specific coordinate range. Given that the coordinate system starts at the bottom left corner of the image, with the origin at 0.0, 0.0 and maximum coordinates at 1.0, 1.0, can you confirm if the point you are aiming at, point (0.161, 0.870), is indeed where the red fabric flags at center are located?" }, { "from": "gpt", "value": "Yes, the point (0.161, 0.870) corresponds to the red fabric flags at center, so aiming at that coordinate will capture them." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e7ac46cbae12569e.jpg", "conversations": [ { "from": "human", "value": "\nDoes white cotton shirt at right have a greater width compared to white matte shirt at center?" }, { "from": "gpt", "value": "In fact, white cotton shirt at right might be narrower than white matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5fd2eed1f74baf35.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at center have a lesser height compared to transparent rubber windshield at lower center?" }, { "from": "gpt", "value": "Incorrect, green leafy tree at center's height does not fall short of transparent rubber windshield at lower center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d93c40d9c210ed5d.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the gray suit at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.352, 0.348)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc0ffbccd7844229.jpg", "conversations": [ { "from": "human", "value": "\nCould you measure the distance between weathered wood hut at center and rustic wooden wagon at center?" }, { "from": "gpt", "value": "weathered wood hut at center is 24.50 meters from rustic wooden wagon at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b98002c5ccff5633.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the pink fabric flag at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.609, 0.427)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/581a546e22e80ae7.jpg", "conversations": [ { "from": "human", "value": "\nDoes red matte jacket at center have a greater height compared to matte pink sweater at center?" }, { "from": "gpt", "value": "No, red matte jacket at center is not taller than matte pink sweater at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b10dc65e4a833d76.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a green striped polo shirt at left. Pinpoint a point to the green striped polo shirt at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.281, 0.677)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d3fcd490b982b06.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, white wooden bookshelf at left or matte pink bikini top at center, stands taller?" }, { "from": "gpt", "value": "white wooden bookshelf at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc61b4a136376e1f.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, metallic silver microphone at upper center or black metallic microphone at center, stands taller?" }, { "from": "gpt", "value": "With more height is metallic silver microphone at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f65adccc914821fe.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at a wedding and need to adjust the camera settings to capture both the white satin dress at center and the matte gray suit at center clearly. Since the dress is narrower, you decide to focus on the wider object. Which object should you focus on?" }, { "from": "gpt", "value": "The white satin dress at center is narrower than the matte gray suit at center, so you should focus on the matte gray suit at center as it is wider." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7cf5446cc5d9640.jpg", "conversations": [ { "from": "human", "value": "\nBetween black matte door at center and black matte signboard at center, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "Positioned to the right is black matte signboard at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3beb4fc164731b6a.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.311, 0.331) or (0.716, 0.302)?" }, { "from": "gpt", "value": "Point (0.311, 0.331)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/527bdfe5f46e7a60.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.971, 0.095) in front of point (0.642, 0.516)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/52f253269b01ad0b.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the white matte shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.538, 0.508)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c411d68e1166f9e.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.090, 0.438) or point (0.339, 0.644)?" }, { "from": "gpt", "value": "Positioned behind is point (0.339, 0.644)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/af67b5cd8790d137.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the highest point of the hill and looking down. Which wooden cabin is closer to you, the wooden cabin at center or the wooden cabin at left?" }, { "from": "gpt", "value": "The wooden cabin at center is closer to you because it is located below the wooden cabin at left, meaning it is situated lower on the slope and thus nearer to your vantage point at the top." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7d0d5f48b2bc90e0.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between point (0.377, 0.825) and camera." }, { "from": "gpt", "value": "They are 13.80 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/47700efd6a56d538.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white glossy table at center is smaller than dark suit at center?" }, { "from": "gpt", "value": "No, white glossy table at center is not smaller than dark suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/33d0ae5762d41d2d.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between point (0.383, 0.711) and camera?" }, { "from": "gpt", "value": "Point (0.383, 0.711) and camera are 291.27 feet apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02c9edc8cacebc1c.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of red dotted shirt at center?" }, { "from": "gpt", "value": "A distance of 2.95 meters exists between red dotted shirt at center and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6f277c2a00299b6.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.859, 0.294)?" }, { "from": "gpt", "value": "green leafy tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e39c920d4a582c56.jpg", "conversations": [ { "from": "human", "value": "\nLocate the wooden boardwalk at center-right in the image." }, { "from": "gpt", "value": "[(0.784, 0.891)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d1663e63cfdce8c.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer reviewing this image of the Eiffel Tower. You notice the black woolen sweater at upper left and the smooth skin hand at upper center. Which object is located more to the left in the image?" }, { "from": "gpt", "value": "The black woolen sweater at upper left is positioned more to the left than the smooth skin hand at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f849060844888d68.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if orange scarf at center is smaller than smooth black hair at center?" }, { "from": "gpt", "value": "No, orange scarf at center is not smaller than smooth black hair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6a8d127e1697f05.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green textured tree at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.313, 0.331)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f23598f2c6f7c767.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the party and want to take a photo of both the pink satin shirt at center and the matte white shirt at center. However, you need to ensure that both shirts are fully visible in the photo. Based on their positions, which shirt should you focus on first to ensure the other is also in the frame?" }, { "from": "gpt", "value": "The pink satin shirt at center is in front of the matte white shirt at center. To ensure both are fully visible, focus on the matte white shirt at center first, as it is behind and adjusting focus there might keep the pink satin shirt at center in the frame as well." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b19567e2bd430c2.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.380, 0.361) or point (0.257, 0.752)?" }, { "from": "gpt", "value": "Point (0.257, 0.752) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb12a232d9d2b384.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of yellow matte shirt at upper center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.604, 0.128)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a011226c01e2faa.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.745, 0.827)?" }, { "from": "gpt", "value": "green grassy field at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92449fea69c4d922.jpg", "conversations": [ { "from": "human", "value": "\nBetween black fabric shirt at center and silver metallic laptop at left, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "silver metallic laptop at left is more to the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b99bef0e5de718a.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray fleece jacket at left appear over matte purple sweatshirt at center?" }, { "from": "gpt", "value": "No, gray fleece jacket at left is not above matte purple sweatshirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a1fc2aacd1f99cd3.jpg", "conversations": [ { "from": "human", "value": "\nWhere is white matte bow tie at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.514, 0.592)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/97ec2af3c98b5a07.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green matte can at lower left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.229, 0.958)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/720fbde29be3a19d.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.642, 0.536) positioned after point (0.359, 0.750)?" }, { "from": "gpt", "value": "Yes, point (0.642, 0.536) is farther from viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1cb44243a7414c67.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the event and want to take a photo that includes both the blue fabric shirt at upper right and the matte black apron at left. Which of the two items should you position closer to the bottom of the frame to ensure both are fully visible?" }, { "from": "gpt", "value": "The blue fabric shirt at upper right is not as tall as matte black apron at left. To ensure both are fully visible in the photo, position the shorter blue fabric shirt at upper right closer to the bottom of the frame so that its shorter height accommodates within the frame along with the taller matte black apron at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a92b30786c52c418.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of white fluffy cloud at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.451, 0.683)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ad019010fcf07b8.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, orange crumbly pastry at center or golden-brown crispy pastry at center?" }, { "from": "gpt", "value": "Positioned lower is orange crumbly pastry at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/319762cdbb6a4728.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.418, 0.955) closer to viewer compared to point (0.529, 0.666)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed21dd98fbe620c1.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.266, 0.744) come farther from viewer compared to point (0.578, 0.578)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca02dd561f410a16.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position in the winter landscape scene. There is a point marked at coordinate point (0.317, 0.233). If you want to walk directly to that point, how far would you have to walk in feet?" }, { "from": "gpt", "value": "The distance between the camera and point (0.317, 0.233) is 209.97 feet, so you would have to walk 209.97 feet to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5450053a04f24a4.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of point (0.648, 0.202)?" }, { "from": "gpt", "value": "3.10 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9040e60084f9d549.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green textured tree at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.537, 0.300)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dad10b7c15396d49.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between point (0.193, 0.850) and camera?" }, { "from": "gpt", "value": "They are 5.68 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb802a91339a57a2.jpg", "conversations": [ { "from": "human", "value": "\nYou are on the motorboat Cantius and need to determine the position of two points marked on the deck. Which point is closer to you, point (0.497, 0.048) or point (0.421, 0.136)?" }, { "from": "gpt", "value": "Point (0.497, 0.048) is further to the viewer than point (0.421, 0.136), so point (0.421, 0.136) is closer to you." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4b9e0d9cf4c3414.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.760, 0.995) come closer to viewer compared to point (0.313, 0.645)?" }, { "from": "gpt", "value": "Yes, point (0.760, 0.995) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/661d4f579727d229.jpg", "conversations": [ { "from": "human", "value": "\nBetween stone tower at center and stone clock tower at center, which one is positioned higher?" }, { "from": "gpt", "value": "stone clock tower at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9221d8a357a96db.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the rustic covered bridge and notice two elements in the scene. One is the rusty metal barn at center and the other is the bare branches at left. From your vantage point on the bridge, which of these two objects appears closer to you?" }, { "from": "gpt", "value": "The rusty metal barn at center is located below the bare branches at left, so from your position on the bridge, the bare branches at left would appear closer because they are positioned above the barn." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/824d40f908246db6.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the left, green textured tree at upper center or green water at lower center?" }, { "from": "gpt", "value": "Positioned to the left is green textured tree at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d99ad8b519b474a6.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the matte gold lamp at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.556, 0.558)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c6228cb7d6e53326.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.112, 0.442) or point (0.552, 0.547)?" }, { "from": "gpt", "value": "Positioned in front is point (0.552, 0.547)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/59dd9e9e8fc9e571.jpg", "conversations": [ { "from": "human", "value": "\nHow far is point (0.270, 0.695) from the camera?" }, { "from": "gpt", "value": "Point (0.270, 0.695) and camera are 72.17 feet apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7f73001ac1514abf.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the floral cotton dress at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.340, 0.795)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/609ef348d55b25f9.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.497, 0.616)?" }, { "from": "gpt", "value": "orange lace dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e91293c8a4114fe.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the matte silver sedan at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.743, 0.861)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0346eee158d08acb.jpg", "conversations": [ { "from": "human", "value": "\nYou are a LEGO builder trying to place a blue matte helmet at center on top of the green matte vehicle at center. Based on the size of the helmet and the vehicle, will the helmet fit securely on top without falling off?" }, { "from": "gpt", "value": "The green matte vehicle at center is bigger than the blue matte helmet at center, so the helmet will fit securely on top without falling off." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb8902b41b7cc2d0.jpg", "conversations": [ { "from": "human", "value": "\nBetween dark gray jacket at right and white fluffy snowball at upper center, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "From the viewer's perspective, dark gray jacket at right appears more on the left side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78c44dc04fae7941.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the dark blue suit at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.202, 0.836)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f99bcaed521df5d4.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the concrete bunker at upper left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.139, 0.259)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b40d388159e1f16c.jpg", "conversations": [ { "from": "human", "value": "\nIs light brown hair at lower left below smooth skin face at lower left?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/69ef533f41e352d1.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of 2 JAYS CAFE and want to know how far the point at coordinates point (0.690, 0.984) is from you. Can you determine the distance?" }, { "from": "gpt", "value": "The distance between you and point (0.690, 0.984) is 200.34 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7433ca036edee067.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the green leafy tree at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.723, 0.819)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/27b0a0f00af3bee4.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, brown muddy water at center or orange fabric saree at center?" }, { "from": "gpt", "value": "brown muddy water at center is below." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8333e8c50b909a4c.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.023, 0.122) positioned in front of point (0.673, 0.022)?" }, { "from": "gpt", "value": "Yes, point (0.023, 0.122) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f1847d8e1657500.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.225, 0.906) and point (0.489, 0.509), which one is positioned in front?" }, { "from": "gpt", "value": "Positioned in front is point (0.225, 0.906)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/116aa0742e21e486.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of dark brown hair at lower left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.485, 0.762)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/62c1d28bfd5d67a4.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker planning to drive a 3.5 meter wide truck along the brown dirt track at lower center near the brown rocky mountain at center. Based on the scene, can the truck safely pass through the track?" }, { "from": "gpt", "value": "The brown dirt track at lower center is narrower than the brown rocky mountain at center, but the width comparison between the track and the truck is not provided. However, since the track is narrower than the mountain, it might not be wide enough for the truck. Further information about the track width is needed to confirm." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b4eee24854be114.jpg", "conversations": [ { "from": "human", "value": "\nYou are an artist planning to paint the scene. You want to ensure the green leafy tree at upper center and the polished bronze sculpture at center are proportionally accurate. Which object should you make wider in your painting?" }, { "from": "gpt", "value": "The green leafy tree at upper center should be made wider in the painting since its width is larger than the polished bronze sculpture at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7083134a1efcf75a.jpg", "conversations": [ { "from": "human", "value": "\nDescribe the object at (0.714, 0.839)." }, { "from": "gpt", "value": "brown copper penny at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/273da9d54d8e3766.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the kitchen facing the sink area. There are two points marked in the scene. Which point, point (0.902, 0.223) or point (0.927, 0.011), is closer to you?" }, { "from": "gpt", "value": "Point (0.927, 0.011) is closer to you because it is in front of point (0.902, 0.223)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d5b3470f42622b5.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a photo of the white embroidered shirt at left and the yellow matte corn at center. Since you want both subjects to be in focus, you need to know which one is taller. Can you tell me which one is taller?" }, { "from": "gpt", "value": "The white embroidered shirt at left is much taller than the yellow matte corn at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d8933749b1009fb.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, white matte table at center or green matte bottle at lower left?" }, { "from": "gpt", "value": "white matte table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ded7949218c0780.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.656, 0.592) and point (0.551, 0.425), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.551, 0.425) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6e1131feac8d4a5.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, black matte person at lower center or dark brown leather jacket at center, stands taller?" }, { "from": "gpt", "value": "dark brown leather jacket at center is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab8c5416578b9f0a.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.897, 0.003) or point (0.561, 0.797)?" }, { "from": "gpt", "value": "Point (0.897, 0.003) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd50b8f49fae1623.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a white fluffy cloud at upper center. Pinpoint a point to the white fluffy cloud at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.496, 0.261)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ddc2afe6886e65f8.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.767, 0.916) lie behind point (0.723, 0.102)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7f1d6bdeca93bd0b.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of white smooth shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.481, 0.534)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/487bda72b19f12e9.jpg", "conversations": [ { "from": "human", "value": "\nWhat is located at the coordinates point (0.553, 0.456) in the image?" }, { "from": "gpt", "value": "The point (0.553, 0.456) indicates the white cotton kimono at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a82acd0738a91481.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of brown wood tree at upper center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.511, 0.283)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d418dd7a320e5cac.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.537, 0.430) or point (0.000, 0.289)?" }, { "from": "gpt", "value": "Point (0.000, 0.289)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c758a2bed81a1fce.jpg", "conversations": [ { "from": "human", "value": "\nWhere is brown sandy beach at lower center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.407, 0.869)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/901524dd31ecd6e8.jpg", "conversations": [ { "from": "human", "value": "\nYou are planning to place a new potted plant in the courtyard. The plant needs to be under the white fabric canopy at center to avoid direct sunlight. Where should you position the plant relative to the brown wooden table at center?" }, { "from": "gpt", "value": "The white fabric canopy at center is above the brown wooden table at center, so placing the plant near the brown wooden table at center will ensure it stays under the canopy and out of direct sunlight." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/544950ffe3966604.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person who needs to place a package that is 36 inches long on the table. The package must be placed between the brown matte tea at upper center and the edge of the table. Is there enough space?" }, { "from": "gpt", "value": "The brown matte tea at upper center and the viewer are 36.51 inches apart. Since the package is 36 inches long, there is enough space to place it between the brown matte tea at upper center and the edge of the table as the distance is slightly larger than the package length." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6668cacb25622334.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.664, 0.408) and point (0.336, 0.619), which one is positioned behind?" }, { "from": "gpt", "value": "Positioned behind is point (0.664, 0.408)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e4eb48df257adf77.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the traditional building with the blue and white striped awning. There is a point marked at coordinates (0.641, 0.872). If you want to reach that point, how far do you need to walk from your current position?" }, { "from": "gpt", "value": "The point at (0.641, 0.872) is 11.59 feet away from the viewer, so you need to walk 11.59 feet to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5decdfa7a7231885.jpg", "conversations": [ { "from": "human", "value": "\nHow close is point (0.626, 0.553) from camera?" }, { "from": "gpt", "value": "Point (0.626, 0.553) is 167.99 feet away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/686e41d285251745.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the dark blue fleece at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.300, 0.656)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d8c7dc73e3fc7597.jpg", "conversations": [ { "from": "human", "value": "\nIs embroidered fabric blouse at center to the right of white silk headscarf at upper left from the viewer's perspective?" }, { "from": "gpt", "value": "Indeed, embroidered fabric blouse at center is positioned on the right side of white silk headscarf at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c3105680b8fd6fb.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the waterfront near PIER 35 and want to walk towards the point labeled point (0.795, 0.958). However, there is an obstacle at point (0.664, 0.889). Will you encounter the obstacle before reaching your destination?" }, { "from": "gpt", "value": "Since point (0.795, 0.958) is in front of point (0.664, 0.889), you will reach point (0.795, 0.958) before encountering the obstacle at point (0.664, 0.889)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/642adf2d08c516ce.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, matte black hair at center or metal mesh table at center, stands taller?" }, { "from": "gpt", "value": "With more height is matte black hair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0cbfcfb9358eebe7.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.372, 0.534) and point (0.927, 0.506), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.927, 0.506) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/362ec9ce26f89220.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.692, 0.680) from camera?" }, { "from": "gpt", "value": "Point (0.692, 0.680) and camera are 8.19 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1312e16bcf7c5f7.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, velvet black coat at center or floral silk scarf at center, stands taller?" }, { "from": "gpt", "value": "With more height is velvet black coat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/17f9195f10a09d02.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.387, 0.806) positioned before point (0.562, 0.641)?" }, { "from": "gpt", "value": "Yes, point (0.387, 0.806) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e47bcb9c19b484a9.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the dining area and want to move closer to the woven wood chair at center. If your current position is 2 meters away from the chair, how many more meters do you need to walk to reach it?" }, { "from": "gpt", "value": "The distance between the woven wood chair at center and the camera is 3.11 meters. Since you are currently 2 meters away, you need to walk an additional 1.11 meters to reach the chair." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/130049fe28dda5c8.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.918, 0.425) or (0.464, 0.380)?" }, { "from": "gpt", "value": "Positioned in front is point (0.918, 0.425)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9889e90b2f9ec8f.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, yellow matte jersey at center or yellow jersey at upper center?" }, { "from": "gpt", "value": "Positioned higher is yellow jersey at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a548ec5ef02dbd5.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of metallic balloons at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.218, 0.472)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/686ee5a06f82dedc.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.508, 0.887)?" }, { "from": "gpt", "value": "fallen leaves at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/13f73c094ef3c092.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.296, 0.273) come farther from viewer compared to point (0.633, 0.522)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3f16c397f32c00c1.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the Salzach River bridge and want to know the distance between the clear water at center and the white stone church at center. What is the distance between them?" }, { "from": "gpt", "value": "The clear water at center is 51.15 meters away from the white stone church at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1cbf039769c2558c.jpg", "conversations": [ { "from": "human", "value": "\nLocate all glossy white panda at center in the image." }, { "from": "gpt", "value": "[(0.485, 0.661)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/200ad51507ce250a.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte phone at center above smooth skin hand at center?" }, { "from": "gpt", "value": "No, black matte phone at center is not above smooth skin hand at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/139c780e8314fa3b.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of green grass at center in the image." }, { "from": "gpt", "value": "[(0.518, 0.787)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ced5dcb31e839407.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the base of the mountains and looking up at the white fluffy cloud at upper center. If you want to estimate the distance between you and the cloud, what would be the approximate distance?" }, { "from": "gpt", "value": "The white fluffy cloud at upper center and viewer are 354.61 meters apart, so the approximate distance is 354.61 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/413f229e0886f77b.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.156, 0.158) come behind point (0.772, 0.725)?" }, { "from": "gpt", "value": "Yes, it is behind point (0.772, 0.725)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/80ee9b10957d0e53.jpg", "conversations": [ { "from": "human", "value": "\nYou are at an event and want to locate the green glossy table at center. According to the coordinates provided, where would you find it?" }, { "from": "gpt", "value": "The green glossy table at center is located at point coordinates of (0.535, 0.806)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/22d808b4297144d8.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black wool coat at left is thinner than dark gray uniform at center?" }, { "from": "gpt", "value": "Indeed, black wool coat at left has a lesser width compared to dark gray uniform at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d20629403b5759c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, red matte jacket at lower right or dark blue t-shirt at right, stands shorter?" }, { "from": "gpt", "value": "red matte jacket at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00383d8a0db75865.jpg", "conversations": [ { "from": "human", "value": "\nIs dark wood mirror at upper center to the left of wooden towel bar at center from the viewer's perspective?" }, { "from": "gpt", "value": "No, dark wood mirror at upper center is not to the left of wooden towel bar at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49ab22d83307d412.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture both the fluffy white dog at center and the fuzzy black dog at center in a single frame. Based on their positions, which dog would appear wider in the photo?" }, { "from": "gpt", "value": "The fluffy white dog at center might appear wider than fuzzy black dog at center according to the description." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/495eb207cc92f4fa.jpg", "conversations": [ { "from": "human", "value": "\nHow much distance is there between matte black bicycle at center and black matte bicycle at center?" }, { "from": "gpt", "value": "matte black bicycle at center and black matte bicycle at center are 4.89 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/74efd996c2ac9477.jpg", "conversations": [ { "from": "human", "value": "\nWhat is at (0.828, 0.494)?" }, { "from": "gpt", "value": "matte black square at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46fd62dd993bcc17.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.219, 0.092) and point (0.876, 0.594), which one is positioned behind?" }, { "from": "gpt", "value": "Point (0.876, 0.594)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d4990ee682f16da8.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, blue matte water bottle at center or metallic blue car at left?" }, { "from": "gpt", "value": "metallic blue car at left is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92088c87c3ac2261.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.875, 0.556) and point (0.346, 0.508), which one is positioned behind?" }, { "from": "gpt", "value": "Positioned behind is point (0.875, 0.556)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5ae5e3c256dcde60.jpg", "conversations": [ { "from": "human", "value": "\nLocate green leafy palm tree at center in the image." }, { "from": "gpt", "value": "[(0.734, 0.536)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/28dd738e47775f1d.jpg", "conversations": [ { "from": "human", "value": "\nYou are a wildlife photographer trying to capture the leopard in the tree. The brown rough tree trunk at center and the spotted fur leopard at center are both in your viewfinder. Which object appears larger in your photo?" }, { "from": "gpt", "value": "The spotted fur leopard at center appears larger in the photo because the brown rough tree trunk at center is smaller in size compared to it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/318f426652748058.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.344, 0.923) positioned in front of point (0.362, 0.486)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/25596d7e62003e63.jpg", "conversations": [ { "from": "human", "value": "\nYou need to place a 15 cm wide package on the table. Which object, the brown cardboard box at center or the gray cotton shirt at upper left, has enough space to accommodate it?" }, { "from": "gpt", "value": "The gray cotton shirt at upper left has a width greater than the brown cardboard box at center. Therefore, the gray cotton shirt at upper left can accommodate the 15 cm wide package." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cde33fb06cb8ea11.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the minimalist room and want to place a small decorative item between the two points, point (0.147, 0.086) and point (0.316, 0.762). Which point should you place it closer to in order to ensure it is more visible from your current position?" }, { "from": "gpt", "value": "You should place the item closer to point (0.147, 0.086) because it is closer to the viewer than point (0.316, 0.762), making it more visible from your current position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5df092c4b208a934.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green leafy tree at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.680, 0.255)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/09630d1c1beb9038.jpg", "conversations": [ { "from": "human", "value": "\nBased on the scene description, where is the white matte penguin at center located in terms of its 2D coordinates?" }, { "from": "gpt", "value": "The white matte penguin at center is located at the 2D coordinates point (0.833, 0.483)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1e97ad0a39d2686.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery drone that needs to land on the smooth concrete tarmac at right. However, there is a black metal sculpture at right in the way. Can you safely land on the tarmac without hitting the sculpture?" }, { "from": "gpt", "value": "The smooth concrete tarmac at right is taller than the black metal sculpture at right, so the drone can safely land on the tarmac without hitting the sculpture since the sculpture is lower." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0664c733d4fbc020.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.049, 0.419) closer to viewer compared to point (0.511, 0.902)?" }, { "from": "gpt", "value": "Yes, point (0.049, 0.419) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ace0645504e11bb9.jpg", "conversations": [ { "from": "human", "value": "\nYou are examining the wooden figurine and notice two points marked on it. The first point is at coordinates point (0.913, 0.441) and the second is at point (0.084, 0.367). Which of these points is nearer to you as you look at the figurine?" }, { "from": "gpt", "value": "Point (0.913, 0.441) is closer to the camera than point (0.084, 0.367), so the first point is nearer to you." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fcd214ed475e3f53.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark blue water at center is bigger than rocky gray mountain at upper center?" }, { "from": "gpt", "value": "Incorrect, dark blue water at center is not larger than rocky gray mountain at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d70c8daa78bb270.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of point (0.892, 0.286)?" }, { "from": "gpt", "value": "A distance of 22.12 meters exists between point (0.892, 0.286) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/608aa2089c1d00f8.jpg", "conversations": [ { "from": "human", "value": "\nIs beige stone hindu temple at center taller than stone stairs at center?" }, { "from": "gpt", "value": "Correct, beige stone hindu temple at center is much taller as stone stairs at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d23b70c00b962456.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.307, 0.386) and camera." }, { "from": "gpt", "value": "A distance of 7.79 meters exists between point (0.307, 0.386) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2721e35974447d6c.jpg", "conversations": [ { "from": "human", "value": "\nBetween white matte board at center and blue denim shirt at right, which one has less height?" }, { "from": "gpt", "value": "Standing shorter between the two is blue denim shirt at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec7575fabbaf400f.jpg", "conversations": [ { "from": "human", "value": "\nYou need to slice the golden brown crusty bread at upper center using the black plastic handle knife at center. Can the knife reach the entire length of the bread?" }, { "from": "gpt", "value": "The golden brown crusty bread at upper center is larger in size than black plastic handle knife at center, so the knife may not be long enough to reach the entire length of the bread." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dce82328c5f6ac7f.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any green stone at center in the image." }, { "from": "gpt", "value": "[(0.454, 0.848)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e90d104100ab89d.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.145, 0.436) or (0.534, 0.330)?" }, { "from": "gpt", "value": "Point (0.534, 0.330)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f25cdad615c32591.jpg", "conversations": [ { "from": "human", "value": "\nWhat is at (0.481, 0.589)?" }, { "from": "gpt", "value": "green matte tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92c35cb906c8e34f.jpg", "conversations": [ { "from": "human", "value": "\nHow far is point (0.036, 0.894) from the camera?" }, { "from": "gpt", "value": "Point (0.036, 0.894) and camera are 20.89 inches apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea7995d54bfb05c5.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.942, 0.330) or point (0.535, 0.464)?" }, { "from": "gpt", "value": "Point (0.942, 0.330) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d12b25ca5cb149b.jpg", "conversations": [ { "from": "human", "value": "\nWhere is blue fabric couch at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.385, 0.728)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9e00d812adb4b6a8.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of rusty wood dock at center?" }, { "from": "gpt", "value": "rusty wood dock at center is 11.86 feet from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ee8c9cecbb6c9ac.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown leather jacket at upper center have a lesser width compared to dark green jacket at upper left?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ca7dcb92b6090b2.jpg", "conversations": [ { "from": "human", "value": "\nYou are a fashion designer observing a street scene with two central items of clothing, the light blue silk dress at center and the shiny blue shirt at center. Which one has a shorter length?" }, { "from": "gpt", "value": "The light blue silk dress at center is shorter than the shiny blue shirt at center, so the light blue silk dress at center has a shorter length." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c57996d168c6561.jpg", "conversations": [ { "from": "human", "value": "\nIn the urban scene described, there are a black cotton shirt at center and a camouflage fabric rifle at right. From the perspective of an observer facing the scene, which object is positioned to the left?" }, { "from": "gpt", "value": "The black cotton shirt at center is to the left of the camouflage fabric rifle at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5ad0e7f8cff9e6f7.jpg", "conversations": [ { "from": "human", "value": "\nLocate the striped cap at center in the image." }, { "from": "gpt", "value": "[(0.822, 0.545)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ea035d08fdf6864.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, leather jacket at lower right or purple sweater at center?" }, { "from": "gpt", "value": "purple sweater at center is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/26ff014e787c430c.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the right, gray cloudy sky at upper center or white glossy sailboat at center?" }, { "from": "gpt", "value": "Positioned to the right is gray cloudy sky at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c5d6a15b6015c29b.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black suit at center have a greater width compared to black metal tripod at center?" }, { "from": "gpt", "value": "No, matte black suit at center is not wider than black metal tripod at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/289899feaf8d8ef6.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing near the wooden wagon at lower left and want to reach the dolphin in the water. How far do you need to walk to get there?" }, { "from": "gpt", "value": "The wooden wagon at lower left is 25.28 feet away from viewer, so you need to walk 25.28 feet to reach the dolphin in the water." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c67eaf5d125978b2.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any wooden door at left in the image." }, { "from": "gpt", "value": "[(0.205, 0.759)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2a1bdfd036d60090.jpg", "conversations": [ { "from": "human", "value": "\nWhere is matte green plastic box at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.836, 0.220)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d316e10b79a0690.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte red blouse at center appear on the left side of smooth white soup at lower center?" }, { "from": "gpt", "value": "In fact, matte red blouse at center is to the right of smooth white soup at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a3a941c2cc0a7bcc.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to green grass at center? Please provide its 2D coordinates.Where can I find green grass at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.460, 0.170)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e7efa091b9fbecd3.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the purple woven skirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.635, 0.664)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9108d2c0f3ba45ec.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between point (0.415, 0.033) and camera." }, { "from": "gpt", "value": "Point (0.415, 0.033) is 4.01 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf376054d35ef315.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and want to walk to the matte white golf cart at right. How far do you need to walk?" }, { "from": "gpt", "value": "You need to walk 142.28 feet to reach the matte white golf cart at right from the camera position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2532450ac011923.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.671, 0.878) positioned before point (0.034, 0.806)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/75c6bfc07e87a973.jpg", "conversations": [ { "from": "human", "value": "\nYou are a landscape architect designing a new park and want to place a bench along the path. Given the smooth concrete river at lower right and the red plastic sign at lower right, which one is wider so that the bench can be placed closer to it without obstructing the path?" }, { "from": "gpt", "value": "The smooth concrete river at lower right is wider than the red plastic sign at lower right, so placing the bench closer to the smooth concrete river at lower right would be more appropriate as it allows for more space along the path." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a45f78031b9009c.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is blue glassy water at center from camera?" }, { "from": "gpt", "value": "blue glassy water at center is 380.42 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4215e9c15c632b25.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.479, 0.641)?" }, { "from": "gpt", "value": "blue fabric shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a6003e529410a316.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, fluffy white dog at center or fluffy white dog at left?" }, { "from": "gpt", "value": "fluffy white dog at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2d2912e2affa261.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.350, 0.531) or (0.058, 0.502)?" }, { "from": "gpt", "value": "The point (0.058, 0.502) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8cb43a08975bf754.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden bookshelf at center to the left of green striped shirt at left from the viewer's perspective?" }, { "from": "gpt", "value": "Incorrect, wooden bookshelf at center is not on the left side of green striped shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b4c659c833eb32e.jpg", "conversations": [ { "from": "human", "value": "\nIs gray stone statue at center shorter than white fluffy cloud at upper right?" }, { "from": "gpt", "value": "Incorrect, gray stone statue at center's height does not fall short of white fluffy cloud at upper right's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea8a1554cc47785a.jpg", "conversations": [ { "from": "human", "value": "\nYou are an artist trying to paint a scene that includes the matte beige head at center and the brown glossy eye at center. If you want to maintain the correct proportions between them, which object should you paint larger?" }, { "from": "gpt", "value": "The matte beige head at center should be painted larger than the brown glossy eye at center because it is bigger than the brown glossy eye at center according to the description." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01ce052b7cc5bab0.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of white marble statue at center?" }, { "from": "gpt", "value": "The distance of white marble statue at center from camera is 43.23 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2bd1f3a566c4833b.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of red sweater at lower center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.343, 0.900)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8709dea5d46414a8.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of matte black car at center in the image." }, { "from": "gpt", "value": "[(0.671, 0.697)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc87500a471e8375.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker trying to locate your skis on the snowy slope. You see the matte white ski at upper left and the matte black ski at lower left. Which ski is located higher on the slope?" }, { "from": "gpt", "value": "The matte white ski at upper left is positioned higher on the slope than the matte black ski at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6a3ae42d7b1cb43c.jpg", "conversations": [ { "from": "human", "value": "\nIs black uniform pants at center to the left of matte black shirt at center from the viewer's perspective?" }, { "from": "gpt", "value": "Indeed, black uniform pants at center is positioned on the left side of matte black shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ad648bc2232351a.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from point (0.332, 0.434) to camera." }, { "from": "gpt", "value": "Point (0.332, 0.434) is 132.01 feet from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/382b44301b90081a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white snow-covered tree at center is bigger than white snow-covered tree at upper right?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36081fc9e12ca4e9.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown frothy latte at center appear on the right side of golden brown flaky croissant at left?" }, { "from": "gpt", "value": "Indeed, brown frothy latte at center is positioned on the right side of golden brown flaky croissant at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/118925d0b72561e8.jpg", "conversations": [ { "from": "human", "value": "\nDoes white floral shirt at center appear under brown cotton shirt at left?" }, { "from": "gpt", "value": "Correct, white floral shirt at center is located below brown cotton shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c1b854176ec4fe3e.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.890, 0.608) positioned after point (0.612, 0.961)?" }, { "from": "gpt", "value": "Yes, it is behind point (0.612, 0.961)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce60ac194cb7af2f.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden table at center bigger than brown leather jacket at upper right?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08878b3f288cafa2.jpg", "conversations": [ { "from": "human", "value": "\nIs bare branches at center wider than red tiled roof at center?" }, { "from": "gpt", "value": "Indeed, bare branches at center has a greater width compared to red tiled roof at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9bc2355ed25c5191.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of black matte jacket at center in the image." }, { "from": "gpt", "value": "[(0.624, 0.541)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2131db96b29ebb5e.jpg", "conversations": [ { "from": "human", "value": "\nIs matte red santa claus at center thinner than brown leather jacket at lower right?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/003955e1419a0bba.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.738, 0.384) positioned behind point (0.109, 0.263)?" }, { "from": "gpt", "value": "No, (0.738, 0.384) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e7374c303a89cc13.jpg", "conversations": [ { "from": "human", "value": "\nDoes checkered fabric shirt at left have a greater width compared to glossy wood guitar at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/191885e7ea7cb0ee.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between white fabric canopy at upper center and camera?" }, { "from": "gpt", "value": "They are 45.27 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d3e6bea640d5935.jpg", "conversations": [ { "from": "human", "value": "\nBetween white glossy screen door at left and white matte blinds at right, which one is positioned higher?" }, { "from": "gpt", "value": "Positioned higher is white matte blinds at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/faae01b4de706446.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.190, 0.048) or (0.804, 0.166)?" }, { "from": "gpt", "value": "Point (0.190, 0.048) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/181e9f69ccbec189.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing a photo shoot and need to ensure that the red jacket at left and the red knit cap at upper right are visible in the final image. Based on their positions, which object should be placed closer to the camera to ensure both are in focus?" }, { "from": "gpt", "value": "The red jacket at left should be placed closer to the camera because it is positioned under the red knit cap at upper right, meaning it is farther away from the camera. By moving it closer, both objects can be in focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b054bff430bb7d7.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.937, 0.427) and point (0.934, 0.461), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.934, 0.461)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5dec63b1325593c7.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of striped cotton shirt at lower right? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.807, 0.767)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7875fb46b8a4b6c7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white cotton shirt at center is positioned to the left of matte red dress at center?" }, { "from": "gpt", "value": "Incorrect, white cotton shirt at center is not on the left side of matte red dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/69ee51aa3d5f0643.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.219, 0.958) closer to camera compared to point (0.560, 0.672)?" }, { "from": "gpt", "value": "Yes, point (0.219, 0.958) is in front of point (0.560, 0.672)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d183f08f6b6bc45.jpg", "conversations": [ { "from": "human", "value": "\nDoes green textured pine tree at right appear under green matte tree at left?" }, { "from": "gpt", "value": "Yes, green textured pine tree at right is below green matte tree at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f63788b18c2adab6.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, green leafy tree at center or green matte tree at left?" }, { "from": "gpt", "value": "green matte tree at left is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b52e60796c130b21.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of a classic building. There is a dark blue door framed by white ornate columns with decorative carvings. Above the door is a small balcony with a black wrought iron railing. The balcony is supported by two white corbels with carved faces. The steps leading to the door are light stone with wear, and there are black metal railings on both sides. You need to reach a specific point marked at coordinates point (0.456, 0.628). Can you estimate how far this point is from your camera" }, { "from": "gpt", "value": "The distance between point (0.456, 0.628) and the camera is 8.05 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03ab7f1897d99f60.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green matte snowboard at center is positioned below white snow at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/837d66600ee0ff69.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point with coordinates point (0.453, 0.400) and want to walk to the point with coordinates point (0.787, 0.483). According to the scene, will you be moving towards the background or the foreground?" }, { "from": "gpt", "value": "Since point (0.787, 0.483) is behind point (0.453, 0.400), moving from point (0.453, 0.400) to point (0.787, 0.483) means you are moving towards the background." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/000edd2360de4dec.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the green matte tree at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.738, 0.716)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/97a2ffea3f34d188.jpg", "conversations": [ { "from": "human", "value": "\nDoes maroon metallic car at center have a lesser height compared to matte red car at center?" }, { "from": "gpt", "value": "Indeed, maroon metallic car at center has a lesser height compared to matte red car at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/84cf735321cdbc9d.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, dark gray jacket at center or dark blue jacket at center?" }, { "from": "gpt", "value": "With more height is dark gray jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b8162fb79d5d3763.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue fleece jacket at center is positioned to the right of white soft fabric baby at center?" }, { "from": "gpt", "value": "No, blue fleece jacket at center is not to the right of white soft fabric baby at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc77b42b04641bf9.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the event and need to ensure both the matte black dress at center and the clear plastic cup at center are visible in the photo. Given their sizes, which object might require you to adjust your camera focus more carefully to avoid blurring?" }, { "from": "gpt", "value": "The matte black dress at center is larger in size than the clear plastic cup at center, so you may need to adjust the camera focus more carefully on the larger matte black dress at center to ensure both are in focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5f24a03671c042b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray cotton shirt at center is positioned above black fabric at lower right?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c17c09d8f48e1a29.jpg", "conversations": [ { "from": "human", "value": "\nIs green metallic pole at center to the right of light blue denim shorts at left from the viewer's perspective?" }, { "from": "gpt", "value": "Correct, you'll find green metallic pole at center to the right of light blue denim shorts at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7079a4088ec8c4a0.jpg", "conversations": [ { "from": "human", "value": "\nHow close is gray concrete tarmac at center from metallic silver helicopter at center?" }, { "from": "gpt", "value": "gray concrete tarmac at center and metallic silver helicopter at center are 8.96 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f486deac8adc0809.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a white plastic chair at center. Pinpoint a point to the white plastic chair at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.899, 0.811)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d78dd92c1428526c.jpg", "conversations": [ { "from": "human", "value": "\nWhere is black textured dress at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.210, 0.581)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44e9966a48a6066a.jpg", "conversations": [ { "from": "human", "value": "\nDoes green matte shirt at center appear on the left side of white t-shirt at upper center?" }, { "from": "gpt", "value": "Correct, you'll find green matte shirt at center to the left of white t-shirt at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aa0202aacee8274d.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.314, 0.666) farther from camera compared to point (0.927, 0.591)?" }, { "from": "gpt", "value": "Yes, point (0.314, 0.666) is farther from viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/abf8290ad899561f.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte orange shirt at center is smaller than striped cotton dress at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ec2c039e9abb6bc.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.698, 0.253) in front of point (0.662, 0.256)?" }, { "from": "gpt", "value": "Yes, point (0.698, 0.253) is in front of point (0.662, 0.256)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3bdafacd7e68ab05.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to black plastic baby carriage at center? Please provide its 2D coordinates.Where can I find black plastic baby carriage at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.683, 0.727)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82bfbc0dc9baefcf.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.425, 0.795) closer to camera compared to point (0.570, 0.653)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d8fef6cf11d8e6b.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the metallic grid tower at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.229, 0.352)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d55589ae6ca6f16c.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.906, 0.795) and point (0.755, 0.122), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.906, 0.795) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/004dd1bb774a6a89.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black fishnet gloves at center is positioned above white matte shirt at center?" }, { "from": "gpt", "value": "Incorrect, black fishnet gloves at center is not positioned above white matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0190a9a399fbe1de.jpg", "conversations": [ { "from": "human", "value": "\nYou are an interior designer arranging furniture in a room. You have two items to place on a shelf in front of you. The items are the reflective glass mirror at center and the clear glass window at center. According to the scene, which item should you place to the left side of the shelf?" }, { "from": "gpt", "value": "The clear glass window at center should be placed to the left side of the shelf because the reflective glass mirror at center is to the right of it in the scene." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eeea66797a097a0e.jpg", "conversations": [ { "from": "human", "value": "\nDoes gold-framed painting at upper left have a smaller size compared to bronze statue at center?" }, { "from": "gpt", "value": "Actually, gold-framed painting at upper left might be larger than bronze statue at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/57b531faa2e26490.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.909, 0.912) behind point (0.685, 0.472)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6a31330d23f5b091.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.984, 0.642) or point (0.034, 0.517)?" }, { "from": "gpt", "value": "Point (0.984, 0.642) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/32b41c3deb3935df.jpg", "conversations": [ { "from": "human", "value": "\nIs black sequined tank top at center above blonde hair at lower left?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01d018b4e137643d.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of rustic stone buildings at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.505, 0.537)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf26d6740a8f14aa.jpg", "conversations": [ { "from": "human", "value": "\nWhere is denim jacket at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.654, 0.552)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e41c824f84eadd5f.jpg", "conversations": [ { "from": "human", "value": "\nYou are a gardener who wants to mow the lawn. You see the green grass at center and the weathered wood wagon at lower right. Which area should you prioritize mowing first based on their height?" }, { "from": "gpt", "value": "The green grass at center should be prioritized for mowing first since it is much taller than the weathered wood wagon at lower right, indicating it needs attention." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/478699c0ce35f153.jpg", "conversations": [ { "from": "human", "value": "\nIs orange metallic excavator at center in front of yellow plastic tripod at center?" }, { "from": "gpt", "value": "No, orange metallic excavator at center is further to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/242ad686de7f2c8a.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of white smooth shirt at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.768, 0.725)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a055198e99f9bb91.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if metallic wires at center is positioned to the left of bare branches at center?" }, { "from": "gpt", "value": "Indeed, metallic wires at center is positioned on the left side of bare branches at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6813dc844f454192.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.533, 0.537) come in front of point (0.137, 0.394)?" }, { "from": "gpt", "value": "No, (0.533, 0.537) is behind (0.137, 0.394)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f459e7830f982ce.jpg", "conversations": [ { "from": "human", "value": "\nBetween green carved wood door at center and white paper sign at upper center, which one has less height?" }, { "from": "gpt", "value": "Standing shorter between the two is white paper sign at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e8d205d723000fb.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, green fabric curtain at center or polished chrome faucet at center?" }, { "from": "gpt", "value": "polished chrome faucet at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88aba474065e9ff6.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing in the crowd at the event. You want to take a closeup photo of the white furry teddy bear at center. Considering your camera can focus on subjects within 50 feet, will you be able to take the photo without moving closer?" }, { "from": "gpt", "value": "The white furry teddy bear at center is 106.74 feet away from the viewer, which is beyond the camera focus range of 50 feet. Therefore, you cannot take a clear closeup photo without moving closer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f75f99f18df8cdb8.jpg", "conversations": [ { "from": "human", "value": "\nWhat are the coordinates of the striped knit beanie at center in the image?" }, { "from": "gpt", "value": "The striped knit beanie at center is located at coordinates (0.358, 0.263)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c431d402f72a0b2d.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, yellow matte church at center or white matte building at left?" }, { "from": "gpt", "value": "yellow matte church at center is above." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/66d85a1037aae3a9.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is yellow fabric shirt at center from dark blue jacket at lower right?" }, { "from": "gpt", "value": "yellow fabric shirt at center is 23.07 inches from dark blue jacket at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c3ffdf723537546.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the right, weathered wood door at left or green leafy ivy at lower right?" }, { "from": "gpt", "value": "From the viewer's perspective, green leafy ivy at lower right appears more on the right side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ff8c63c2f49d1d2.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.952, 0.797) in front of point (0.123, 0.891)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/067f0b3897604bcd.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, white matte laptop at center or black plastic ipod at upper right?" }, { "from": "gpt", "value": "black plastic ipod at upper right is above." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fdab0343bf640e36.jpg", "conversations": [ { "from": "human", "value": "\nHow far is point (0.469, 0.900) from the camera?" }, { "from": "gpt", "value": "Point (0.469, 0.900) and camera are 11.17 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/991cf31cb969f5ea.jpg", "conversations": [ { "from": "human", "value": "\nDoes camouflage-patterned jacket at lower right appear on the left side of black matte coat at center?" }, { "from": "gpt", "value": "In fact, camouflage-patterned jacket at lower right is to the right of black matte coat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6cccb48019918b63.jpg", "conversations": [ { "from": "human", "value": "\nIs green plastic tray at center positioned in front of green plastic shovel at left?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/752d100fdebf867f.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.144, 0.706)?" }, { "from": "gpt", "value": "black matte suit at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2522fe929d8e55e.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black headband at upper left have a lesser height compared to white matte skull mask at right?" }, { "from": "gpt", "value": "Incorrect, matte black headband at upper left's height does not fall short of white matte skull mask at right's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0e485c2a20dc31d.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the wooden barrel at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.544, 0.448)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1411c6e10bcd32ef.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the denim shirt at center and the green leafy tree at upper center in a single frame. Which object should you focus on first if you want to ensure both are in focus without adjusting the camera settings?" }, { "from": "gpt", "value": "The green leafy tree at upper center is larger than the denim shirt at center, so focusing on the tree first would help ensure both are in focus since it occupies more of the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82eb4c59faed9bc2.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the viewer position and want to reach point (0.273, 0.709). How far do you need to walk to get there?" }, { "from": "gpt", "value": "You need to walk 14.21 meters to reach point (0.273, 0.709) from your current position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16de3a729fa9d203.jpg", "conversations": [ { "from": "human", "value": "\nYou are a farmer planning to install a new fence post between the white matte barn at center and the silver metallic silo at center. Considering their widths, which structure requires more space to accommodate the post without overlapping?" }, { "from": "gpt", "value": "The white matte barn at center has a greater width than the silver metallic silo at center, so it requires more space to accommodate the post without overlapping." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f79fabe2eb7ed37.jpg", "conversations": [ { "from": "human", "value": "\nYou are an architect assessing the statues in front of the classical building. You need to determine which statue is taller between the white marble statue at center and the white marble statue at left. Based on the scene, which one is taller?" }, { "from": "gpt", "value": "The white marble statue at center is much taller than the white marble statue at left according to the description." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/153471b278bfa1ea.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of dark blue t-shirt at center from camera?" }, { "from": "gpt", "value": "The distance of dark blue t-shirt at center from camera is 3.85 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c533f38d3406e2d5.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if beige textured desk at center is positioned below white glossy table at lower right?" }, { "from": "gpt", "value": "Actually, beige textured desk at center is above white glossy table at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca37348dff7b41bf.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green matte car at center is bigger than plaid shirt at center?" }, { "from": "gpt", "value": "Indeed, green matte car at center has a larger size compared to plaid shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/025dc48be9d657fe.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.513, 0.950) lie behind point (0.710, 0.827)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b8a61090e4606588.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point labeled as point (0.973, 0.622) in the train station platform. If you want to take a photo of the brick wall with murals on the left side, how far do you need to walk towards the wall to ensure the entire wall is in your camera frame?" }, { "from": "gpt", "value": "The point labeled (0.973, 0.622) is 12.99 meters away from the camera. To capture the entire brick wall with murals on the left side in your camera frame, you would need to move closer to the wall until the distance between you and the camera is less than 12.99 meters. However, the exact distance required depends on the camera lens and sensor size, which are not provided here." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7da3a696783acd7.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.714, 0.644) and point (0.389, 0.419), which one is positioned in front?" }, { "from": "gpt", "value": "Positioned in front is point (0.714, 0.644)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d63c538f39d471d8.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy palm tree at center taller than transparent plastic goggles at lower left?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c0811f18a705b38.jpg", "conversations": [ { "from": "human", "value": "\nHow close is blue glossy bottle at center from camera?" }, { "from": "gpt", "value": "blue glossy bottle at center is 5.65 feet from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb23bc933ea17c3c.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.933, 0.586) positioned after point (0.608, 0.489)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7993150485b4eea2.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the square in front of the cathedral and see the dark blue jeans at center and the dark gray fabric coat at center. Which item is larger in size?" }, { "from": "gpt", "value": "The dark blue jeans at center is bigger than the dark gray fabric coat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be853c2713a37d0a.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark gray jacket at center appear under matte blue puffer jacket at lower left?" }, { "from": "gpt", "value": "Incorrect, dark gray jacket at center is not positioned below matte blue puffer jacket at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/61af3c7943b93858.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray stone head at center have a larger size compared to smooth stone head at upper center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1284c8712b5e8aca.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.237, 0.805) in front of point (0.531, 0.484)?" }, { "from": "gpt", "value": "Yes, point (0.237, 0.805) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7004d94ec69130a.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, white plastic container at left or high visibility yellow vest at center?" }, { "from": "gpt", "value": "high visibility yellow vest at center is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04f31161fdd55209.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black shorts at center below neon yellow mesh sneaker at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f6ff910093557fb.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the navy blue uniform at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.789, 0.753)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d178a4e23f2de1d.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.263, 0.620) positioned after point (0.397, 0.825)?" }, { "from": "gpt", "value": "Yes, point (0.263, 0.620) is behind point (0.397, 0.825)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/212e98bb2c1891ab.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the green plastic robot at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.305, 0.569)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4a3be1254f50ded.jpg", "conversations": [ { "from": "human", "value": "\nHow far is snowy rock mountain at upper left from brown textured tree at right?" }, { "from": "gpt", "value": "885.75 feet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9675855ee94f0b9.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of satin silver sedan at lower center from camera?" }, { "from": "gpt", "value": "A distance of 59.39 meters exists between satin silver sedan at lower center and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/27d24131cc9cbf1f.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the riverbank and see two points marked in the image. Which point is nearer to you, point (0.213, 0.780) or point (0.673, 0.523)?" }, { "from": "gpt", "value": "Point (0.213, 0.780) is closer to the viewer than point (0.673, 0.523)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02c40c3e76e7c9b9.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.881, 0.314) closer to viewer compared to point (0.358, 0.277)?" }, { "from": "gpt", "value": "No, it is behind (0.358, 0.277)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bec3b9e59f848e7d.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a dark purple shirt at center. Pinpoint a point to the dark purple shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.754, 0.698)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f6a987cb54b9c88b.jpg", "conversations": [ { "from": "human", "value": "\nDescribe the object at (0.203, 0.358)." }, { "from": "gpt", "value": "blue fabric shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8fadf60ed46da4f5.jpg", "conversations": [ { "from": "human", "value": "\nLocate all matte gray sweater at center in the image." }, { "from": "gpt", "value": "[(0.497, 0.617)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/abc7225545161082.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass at lower center bigger than brown tiled roof hut at center?" }, { "from": "gpt", "value": "Incorrect, green grass at lower center is not larger than brown tiled roof hut at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6cdcf70a1e23e7a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if striped cotton shirt at center is positioned above gray fabric backpack strap at center?" }, { "from": "gpt", "value": "Incorrect, striped cotton shirt at center is not positioned above gray fabric backpack strap at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a54cb29d01b189a6.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, dark gray fabric jacket at lower left or black leather jacket at lower right?" }, { "from": "gpt", "value": "black leather jacket at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7827d77937b22eff.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.635, 0.594) farther from viewer compared to point (0.960, 0.436)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2be736e6829f46fc.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.123, 0.631) and point (0.066, 0.195), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.123, 0.631)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/753a12a3d621d854.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between point (0.717, 0.489) and camera." }, { "from": "gpt", "value": "Point (0.717, 0.489) and camera are 7.56 feet apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/14561351f912a985.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a matte green mermaid statue at left. Pinpoint a point to the matte green mermaid statue at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.335, 0.683)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16b41120e06187a0.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.093, 0.866)?" }, { "from": "gpt", "value": "pearl earrings at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0012e8a538b00ebf.jpg", "conversations": [ { "from": "human", "value": "\nBetween clear glass wine glass at center and yellow gelatinous cubes at center, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "yellow gelatinous cubes at center is more to the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/daaa637b1512f6c0.jpg", "conversations": [ { "from": "human", "value": "\nLocate all smooth stone alley at center in the image." }, { "from": "gpt", "value": "[(0.499, 0.897)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c3d24bfaa18526c.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the silver metallic bicycle wheel at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.608, 0.050)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2347d406b5d085cc.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown pinstriped suit at center is taller than black fabric dress at center?" }, { "from": "gpt", "value": "Correct, brown pinstriped suit at center is much taller as black fabric dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c4fb3c10bb304b6.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of printed cotton dress at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.762, 0.411)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/96b9491ffa7ada4a.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of white frothy milkshake at center?" }, { "from": "gpt", "value": "white frothy milkshake at center is 1.71 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd76fac894f3bf2b.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.941, 0.417) farther from camera compared to point (0.013, 0.522)?" }, { "from": "gpt", "value": "Yes, point (0.941, 0.417) is behind point (0.013, 0.522)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b1623d002de377f.jpg", "conversations": [ { "from": "human", "value": "\nLocate the white marble statue at right in the image." }, { "from": "gpt", "value": "[(0.812, 0.880)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e26baf9ed0377c17.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between point (0.409, 0.670) and camera." }, { "from": "gpt", "value": "Point (0.409, 0.670) and camera are 4.26 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5efeeecd4d58356c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, natural wood bookshelf at left or camel wool coat at center, stands taller?" }, { "from": "gpt", "value": "natural wood bookshelf at left is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/67cb0f9ebf786b4c.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a red jacket at lower left. Pinpoint a point to the red jacket at lower left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.129, 0.778)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d095ee0f92c6c0f7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if clear plastic mattress at center is smaller than dark gray t-shirt at center?" }, { "from": "gpt", "value": "Correct, clear plastic mattress at center occupies less space than dark gray t-shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc5cb4f3aaf25a84.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the beach and looking through the palm tree fronds. There are two points marked in the image. Which point is closer to you, point (0.090, 0.738) or point (0.686, 0.184)?" }, { "from": "gpt", "value": "Point (0.090, 0.738) is closer to you because it is further to the camera than point (0.686, 0.184)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf99dcb9472aa860.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of gray asphalt pavement at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.309, 0.720)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/79242dcbb6d8a2c0.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.566, 0.637) and camera." }, { "from": "gpt", "value": "They are 9.53 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60ebf2c3b945661b.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, black matte text at upper center or black matte keyboard at lower left?" }, { "from": "gpt", "value": "black matte keyboard at lower left is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6dc2dd285367cf6d.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from point (0.578, 0.820) to camera." }, { "from": "gpt", "value": "Point (0.578, 0.820) and camera are 38.60 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b8768dbf99187536.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any white paper at left in the image." }, { "from": "gpt", "value": "[(0.195, 0.427)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de0d2e1e592237df.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of black matte scarf at lower center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.783, 0.789)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aed6e6b4b9a20b46.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the grassy area with scattered white flowers and surrounded by trees. You see two points marked in the image. Which point is closer to you, point (0.155, 0.784) or point (0.249, 0.528)?" }, { "from": "gpt", "value": "Point (0.155, 0.784) is closer to you than point (0.249, 0.528)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c438c76de927c73.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if silver metallic laptop at lower right is bigger than white striped shirt at center?" }, { "from": "gpt", "value": "Actually, silver metallic laptop at lower right might be smaller than white striped shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7fc8688599981f2b.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.129, 0.316) or (0.452, 0.459)?" }, { "from": "gpt", "value": "Point (0.129, 0.316) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a37995377a3b21b6.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.963, 0.669) and point (0.569, 0.567), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.569, 0.567) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/69f3e90965222591.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the camera position. You want to place a 2.5 meter long banner between you and the white plastic boat at center. Will the banner fit in the space between you and the boat?" }, { "from": "gpt", "value": "The distance between the camera and the white plastic boat at center is 3.73 meters. Since the banner is 2.5 meters long, it will fit in the space between you and the boat." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd67bfc6fe27f88e.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.125, 0.347)?" }, { "from": "gpt", "value": "silver tarpaulin tent at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0aa7cc57f2101604.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the matte white shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.257, 0.472)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b110d169d968a0db.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked as point (0.920, 0.975) on the road. You want to walk to the camera position. How far do you need to walk?" }, { "from": "gpt", "value": "You need to walk 39.95 feet to reach the camera position from point (0.920, 0.975)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1af7a9b4a3998f12.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to adjust the focus of your camera. You notice two objects in the frame that are important for the shot. The matte black thumb at center and the brown leather hand at lower right. Which object should you focus on first to ensure it appears sharp in the photo?" }, { "from": "gpt", "value": "The matte black thumb at center should be focused on first since it is closer to the viewer than the brown leather hand at lower right, so focusing on it first will ensure it appears sharp." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ad4771903f00c763.jpg", "conversations": [ { "from": "human", "value": "\nBetween translucent plastic cup at lower center and translucent plastic cup at center, which one has less height?" }, { "from": "gpt", "value": "translucent plastic cup at center is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f620cb3ecec81e8.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from point (0.396, 0.500) to camera." }, { "from": "gpt", "value": "Point (0.396, 0.500) is 12.17 feet from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aa0344ea3a8fc987.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth wood deck at center positioned at the back of wooden deck at center?" }, { "from": "gpt", "value": "No, it is in front of wooden deck at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/682edb243e93e4c2.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from glassy transparent bridge at center to translucent glass sculpture at center." }, { "from": "gpt", "value": "glassy transparent bridge at center is 60.88 feet away from translucent glass sculpture at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/96fecc4408b24a6f.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer who just took a picture of a busy street in a city. You notice that the image is overexposed, making most details hard to see. However, you recall that there was a person wearing a dark blue suit standing at a specific location. Using the coordinates provided, can you determine if the dark blue suit at center is positioned closer to the top or bottom of the image?" }, { "from": "gpt", "value": "The dark blue suit at center is located at point (0.248, 0.516). Since the y coordinate is 0.248, which is closer to 0.0 than 1.0, the dark blue suit at center is positioned closer to the bottom of the image." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d460b02081b971d3.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of the ice cream shop on the left side of the street. You want to hand a flyer to a person wearing the dark blue jacket at center and the dark gray sweater at center. Which one is closer to you?" }, { "from": "gpt", "value": "The dark blue jacket at center is 5.68 meters away from the dark gray sweater at center. Since you are at the entrance, the person wearing the dark gray sweater at center is closer to you than the dark blue jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b5447638ecc66b2.jpg", "conversations": [ { "from": "human", "value": "\nIs brown dirt track at center smaller than black rubber boot at lower right?" }, { "from": "gpt", "value": "Yes, brown dirt track at center is smaller than black rubber boot at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/75c8d00824dcc36f.jpg", "conversations": [ { "from": "human", "value": "\nLocate smooth skin at back in the image." }, { "from": "gpt", "value": "[(0.487, 0.534)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/005f51a489e98972.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.588, 0.891) positioned behind point (0.048, 0.716)?" }, { "from": "gpt", "value": "No, it is in front of (0.048, 0.716)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/83d14c5d029edf1f.jpg", "conversations": [ { "from": "human", "value": "\nYou are a bartender preparing a drink and need to place a clear glass bottle at center and a green leafy plant at upper center on a shelf. The shelf is only 5 inches wide. Can both items fit side by side without overlapping?" }, { "from": "gpt", "value": "The clear glass bottle at center is 4.21 inches from the green leafy plant at upper center, so yes, both items can fit side by side on the 5 inch wide shelf since the total required space is less than 5 inches." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0da8b15e7202689.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the camera position. You want to take a closeup photo of the brown leather jacket at center. Can you reach it without moving your position?" }, { "from": "gpt", "value": "The brown leather jacket at center is 2.84 meters away from camera, so yes, you can reach it without moving your position as it is within a typical camera focusing range." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/881fc87a6cc88893.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the group of people on the stone bench. Which object is located at the coordinates point (0.141, 0.611)?" }, { "from": "gpt", "value": "The point (0.141, 0.611) corresponds to the matte gold tunic at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c7eb88910efe286.jpg", "conversations": [ { "from": "human", "value": "\nIs dirt track at center to the right of green textured tree at center from the viewer's perspective?" }, { "from": "gpt", "value": "No, dirt track at center is not to the right of green textured tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34579536473ef00a.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the green leafy cabbage at upper left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.219, 0.234)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4bcee23eb3fd9fe9.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.423, 0.719) or (0.526, 0.103)?" }, { "from": "gpt", "value": "Point (0.423, 0.719) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e282fce140533bb.jpg", "conversations": [ { "from": "human", "value": "\nYou are a passenger sitting in the green polished wood horse cart at center. You want to pat the brown glossy horse at center. Can you reach the horse from your current position?" }, { "from": "gpt", "value": "The green polished wood horse cart at center is above the brown glossy horse at center, so you can reach the horse by leaning forward or stepping down from the cart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/72bd0f738c2b2f9a.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the event and need to capture a photo that includes both the black leather jacket at lower left and the blue stretchy sock at lower right. The camera you are using has a maximum focus range of 4 feet. Can you fit both objects in the frame without moving the camera?" }, { "from": "gpt", "value": "The black leather jacket at lower left and blue stretchy sock at lower right are 4.52 feet apart from each other. Since the maximum focus range is 4 feet, the distance between them exceeds the camera capability. Therefore, you cannot fit both objects in the frame without moving the camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f1da4599fc82384.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the matte black jacket at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.115, 0.463)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6dc1120f4304b173.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.839, 0.294) in front of point (0.179, 0.713)?" }, { "from": "gpt", "value": "No, it is behind (0.179, 0.713)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c6629b572601749c.jpg", "conversations": [ { "from": "human", "value": "\nBetween gray suit at center and matte black suit at left, which one has less height?" }, { "from": "gpt", "value": "matte black suit at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6239c8b89b9d1c14.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.683, 0.441) positioned before point (0.531, 0.572)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1691f43fc2af875f.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the dark matte clothing at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.231, 0.506)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aeb916967f509d51.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.725, 0.916) and point (0.305, 0.364), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.725, 0.916) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f4ad3b0977f63fc4.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the center of the waterfall scene. Which direction should you walk to reach the green leafy tree at left?" }, { "from": "gpt", "value": "The green leafy tree at left is located to the left side of the scene, so you should walk towards the left to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc83108c90798772.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, green leafy tree at center or yellow-green leafy tree at right?" }, { "from": "gpt", "value": "Positioned higher is yellow-green leafy tree at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/65d3f8e2765acc07.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.427, 0.450) and camera." }, { "from": "gpt", "value": "Point (0.427, 0.450) and camera are 1.69 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba41b86775f0a945.jpg", "conversations": [ { "from": "human", "value": "\nYou are a customer sitting at the wooden table in the image. You want to place your phone on the table but need to ensure there is enough space. The phone measures 15 cm in length. Can you determine if there is sufficient space on the table next to the blue plush elephant at center?" }, { "from": "gpt", "value": "The blue plush elephant at center is located at point coordinates, but without knowing the table dimensions or the available space around the elephant, it is impossible to determine if the phone will fit. Additional information about the table size or the elephant placement relative to the table edges is needed." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf453a2d94805d7e.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between purple fabric mat at lower center and camera?" }, { "from": "gpt", "value": "They are 5.58 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c7156f565e73649.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of point (0.096, 0.800)?" }, { "from": "gpt", "value": "The distance of point (0.096, 0.800) from camera is 1.43 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b591c2e5e8a59e09.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of stained glass window at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.485, 0.103)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0154df276cd4cf14.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of brown fabric child at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.444, 0.561)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/63663acd1870d07c.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the origin point of the coordinate system in the image. You want to move towards the white sheer blouse at center. In which direction should you move?" }, { "from": "gpt", "value": "Since the white sheer blouse at center is located at coordinate point 0.616 on the x axis and 0.404 on the y axis, you should move towards the right and slightly forward to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a55428e09637eae.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer adjusting the camera settings for a group photo. You notice the satin black dress at left and the satin brown top at center. Which clothing item should you focus on first if you want to ensure both are in focus, considering their positions?" }, { "from": "gpt", "value": "The satin black dress at left should be focused on first since it is located above the satin brown top at center, allowing the depth of field to cover both items effectively." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ad0d8e488570ba61.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of transparent glass window at center in the image." }, { "from": "gpt", "value": "[(0.492, 0.389)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c11035a79cf0815.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of beige sand at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.464, 0.892)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5aef42c4fc1920ac.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of leopard print shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.412, 0.686)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7fab7c1713497bfc.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the black matte monitor at upper left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.233, 0.320)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/40846d79c138388b.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.441, 0.475) come behind point (0.089, 0.428)?" }, { "from": "gpt", "value": "No, it is in front of (0.089, 0.428)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/766673eb4aad35b1.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in an autumn scene with bright red bushes in the foreground and trees with yellow and orange leaves in the background. There is a point marked at coordinates point (0.482, 0.370). If you want to place a small decorative rock exactly at that point, how far should you walk forward from your current position to reach it?" }, { "from": "gpt", "value": "The distance of point (0.482, 0.370) from viewer is 10.92 meters, so you should walk forward 10.92 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d090101ddb03cb25.jpg", "conversations": [ { "from": "human", "value": "\nDoes marble column at center have a greater width compared to beige marble column at center?" }, { "from": "gpt", "value": "Correct, the width of marble column at center exceeds that of beige marble column at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a412886003aca978.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.623, 0.531)?" }, { "from": "gpt", "value": "matte black jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/269669a4f9c57eef.jpg", "conversations": [ { "from": "human", "value": "\nIs camouflage fabric uniform at center positioned at the back of dark gray uniform at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb2344804f80db89.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of silver metallic ferris wheel at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.263, 0.683)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82cd422478b7ece3.jpg", "conversations": [ { "from": "human", "value": "\nBetween white textured building at center and green metallic street sign at upper right, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "white textured building at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/61e632c8af3811b3.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.621, 0.917) or point (0.283, 0.305)?" }, { "from": "gpt", "value": "The point (0.283, 0.305) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/149b76892cf9afc3.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the yellow matte shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.234, 0.645)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/044d1828f42d7027.jpg", "conversations": [ { "from": "human", "value": "\nLocate all wooden table at center in the image." }, { "from": "gpt", "value": "[(0.499, 0.858)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e635e24ec1502ee3.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.894, 0.352) or (0.258, 0.495)?" }, { "from": "gpt", "value": "The point (0.258, 0.495) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c26c8a8f6a2a6b04.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if purple cotton shirt at center is positioned above matte gray t-shirt at center?" }, { "from": "gpt", "value": "Correct, purple cotton shirt at center is located above matte gray t-shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b15f1155077a5c6.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.671, 0.828) or (0.798, 0.541)?" }, { "from": "gpt", "value": "Point (0.798, 0.541)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/737371588b28e6f7.jpg", "conversations": [ { "from": "human", "value": "\nPoint to beige stone column at center.Point to the beige stone column at center in the image." }, { "from": "gpt", "value": "[(0.300, 0.719)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d30d94ba46787258.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte red scarf at center have a smaller size compared to blue denim jacket at lower left?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9a199f8ffe7cef4c.jpg", "conversations": [ { "from": "human", "value": "\nIs rustic sandstone rock formation at center above snow-covered rock formation at upper right?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f053af9f118ece9.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.790, 0.958) and camera." }, { "from": "gpt", "value": "They are 31.75 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b88b85dc7797158.jpg", "conversations": [ { "from": "human", "value": "\nIs white snow ski slope at center further to the viewer compared to orange softshell jacket at center?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/20aa8c96c798de51.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.468, 0.653) closer to viewer compared to point (0.389, 0.412)?" }, { "from": "gpt", "value": "No, it is behind (0.389, 0.412)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ecec9ef156dfdd70.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the brown murky water at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.779, 0.812)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3905d71b7806beda.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the center of the baseball stadium and want to take a photo of both the banner and the upper stands. The banner is located at point (0.678, 0.662) and the upper stands are at point (0.919, 0.903). Based on their positions, which object is closer to you?" }, { "from": "gpt", "value": "Point (0.919, 0.903) is closer to you than point (0.678, 0.662), so the upper stands are closer to you than the banner." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/96ee339ace0bdabb.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if yellow matte flowers at center is smaller than blue glossy statue at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5798cf1dd132e981.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the origin point of the image coordinate system. You see a matte blue dress at center located at point (0.531, 0.617). If you want to walk towards the matte blue dress at center, which direction should you move in terms of the coordinate system?" }, { "from": "gpt", "value": "The matte blue dress at center is located at point (0.531, 0.617), so you should move towards the positive x and y directions to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dfbd83cf972aa84c.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing in a high rise building. You want to take a photo of the cityscape through the transparent glass window at center while wearing the matte blue shirt at center. Considering the distance between the shirt and the window, will you be able to avoid your reflection appearing in the photo?" }, { "from": "gpt", "value": "The distance between the transparent glass window at center and the matte blue shirt at center is 98.71 meters. Since the photographer is standing 98.71 meters away from the window, their reflection would not appear in the photo as they are too far from the glass surface to be reflected." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1e4982b7257caca.jpg", "conversations": [ { "from": "human", "value": "\nYou are a maintenance worker tasked with checking the safety of the balustrades and rails at the building entrance. You have a measuring tape and need to determine which one is wider between the metallic gray balustrade at upper center and the metallic rail at lower center without direct measurement. Based on the scene description, which one should you prioritize checking first due to its width?" }, { "from": "gpt", "value": "The metallic gray balustrade at upper center is wider than the metallic rail at lower center, so you should prioritize checking the metallic gray balustrade at upper center first due to its larger width." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aec620b5d80203a9.jpg", "conversations": [ { "from": "human", "value": "\nHow far is green grass at center from camera?" }, { "from": "gpt", "value": "A distance of 4.04 feet exists between green grass at center and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/849f3fd7ac2072d2.jpg", "conversations": [ { "from": "human", "value": "\nHow far is point (0.626, 0.037) from the camera?" }, { "from": "gpt", "value": "The distance of point (0.626, 0.037) from camera is 3.44 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/494c4cd1af8e1661.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of white fluffy snow at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.495, 0.719)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0888345b813c9f20.jpg", "conversations": [ { "from": "human", "value": "\nYou are a parent looking for a place to put a baby bottle. You see the clear glass window at center and the clear plastic dishwasher at lower left. Which object is closer to you, and can you place the baby bottle on it?" }, { "from": "gpt", "value": "The clear glass window at center is in front of the clear plastic dishwasher at lower left, so the window is closer. However, the window is likely not a suitable surface for placing the baby bottle as it is a window. The dishwasher might be open, but it contains dishes and bottles already. Consider using the wooden table instead which is mentioned in the scene description as having a baby bottle already present." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77724869314a75a7.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the gray stone ledge at lower center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.483, 0.822)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d82ca92c82cf1861.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.085, 0.431) and camera?" }, { "from": "gpt", "value": "A distance of 9.15 meters exists between point (0.085, 0.431) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c11d5595bad24fd.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of smooth gray water at lower right? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.759, 0.880)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6390c8a1c6b108c8.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.884, 0.245)?" }, { "from": "gpt", "value": "smooth skin face at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1acac8db3a9b95c5.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.053, 0.289)?" }, { "from": "gpt", "value": "green leafy tree at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/663801fea66411f4.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of smooth bark tree at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.407, 0.206)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8cd4fe35a544d58a.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the yellow fabric tank top at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.124, 0.477)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95d49c078f422088.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the green concrete pool at lower left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.255, 0.825)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9dd05270786d91a.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, dark green sweater at center or blue shirt at upper right, stands shorter?" }, { "from": "gpt", "value": "Standing shorter between the two is blue shirt at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de38f9a1015b9f95.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.176, 0.347) closer to viewer compared to point (0.743, 0.170)?" }, { "from": "gpt", "value": "No, (0.176, 0.347) is further to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/832c5387f9f65342.jpg", "conversations": [ { "from": "human", "value": "\nBetween green leafy palm tree at center and matte purple shirt at center, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "green leafy palm tree at center is more to the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a30a805272700fe4.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.494, 0.428)?" }, { "from": "gpt", "value": "black lace lingerie at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/370c20a5830ab690.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the white shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.338, 0.580)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e41371abc73f399c.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of black asphalt road at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.733, 0.883)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e94d4bfc7e0d12a.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the blue fabric umbrella at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.781, 0.420)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6fdb92954d90dbd8.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if american flag at right is bigger than light brown wood construction worker at upper center?" }, { "from": "gpt", "value": "Yes, american flag at right is bigger than light brown wood construction worker at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ffd4ff641f647696.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green grassy at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.479, 0.822)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2bd296d2aeceba12.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, stone ruins at center or purple fabric at lower right?" }, { "from": "gpt", "value": "Positioned lower is purple fabric at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/132471d2a85c4a9e.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the left, blue fabric jacket at lower left or blue sweater at left?" }, { "from": "gpt", "value": "From the viewer's perspective, blue fabric jacket at lower left appears more on the left side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00863c5b0017c8f0.jpg", "conversations": [ { "from": "human", "value": "\nWhat is at (0.787, 0.528)?" }, { "from": "gpt", "value": "light blue smooth egg at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ae660799ff701fd0.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the bronze sculpture on the rocky base. You notice a specific point marked at coordinates point (0.515, 0.380). How far is that point from your current position?" }, { "from": "gpt", "value": "The point (0.515, 0.380) is 4.83 meters from the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c6a08e7ca42c765.jpg", "conversations": [ { "from": "human", "value": "\nYou are a stage designer checking the outfits displayed on the stage. You notice the golden fabric dress at center and the matte yellow sweater at center. Which outfit takes up more horizontal space on the stage?" }, { "from": "gpt", "value": "The golden fabric dress at center has a greater width than the matte yellow sweater at center, so it takes up more horizontal space on the stage." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/555f8acd61966dba.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between striped cotton shirt at center and camera." }, { "from": "gpt", "value": "The distance of striped cotton shirt at center from camera is 1.71 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/84eeae4ed73608d7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if silver metallic suv at lower right is positioned to the left of shiny black car at lower left?" }, { "from": "gpt", "value": "No, silver metallic suv at lower right is not to the left of shiny black car at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1125bc127db5e50c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if frosted wood tree at left is taller than frosted branches at center?" }, { "from": "gpt", "value": "Yes, frosted wood tree at left is taller than frosted branches at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a0d946a05b7a2b1b.jpg", "conversations": [ { "from": "human", "value": "\nIs matte orange guitar at left taller than orange wood guitar at left?" }, { "from": "gpt", "value": "Yes, matte orange guitar at left is taller than orange wood guitar at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/21800f788b24ec7d.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between shiny black uniform at center and camera?" }, { "from": "gpt", "value": "shiny black uniform at center is 4.91 feet away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1c300cdb7d5375a.jpg", "conversations": [ { "from": "human", "value": "\nIs white shirt at left above matte white dress at center?" }, { "from": "gpt", "value": "No, white shirt at left is not above matte white dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/79bbb7b925db35ba.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of matte pink leggings at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.576, 0.778)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb55f6e754232f89.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the camouflage fabric pants at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.590, 0.295)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e7530d6717c31c6.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.840, 0.722) and point (0.692, 0.567), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.692, 0.567) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7407c323881d3e4.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer taking a picture of the person in the scene. You want to ensure that both the dark brown hair at center and the yellow printed bikini top at center are clearly visible in the frame. Which object should you adjust your focus on first to ensure proper alignment?" }, { "from": "gpt", "value": "The dark brown hair at center is positioned on the right side of yellow printed bikini top at center. Since the hair is on the right, you should focus on the dark brown hair at center first to ensure proper alignment with the bikini top." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/91a307fac18777dd.jpg", "conversations": [ { "from": "human", "value": "\nYou are a guest at a garden party and want to sit as close as possible to the charcoal wood fire at center without getting too warm. The white plastic chair at upper center is available. How far is the chair from the fire?" }, { "from": "gpt", "value": "The distance between the white plastic chair at upper center and the charcoal wood fire at center is 3.47 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ade169a944a98d1f.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked by coordinates point (0.523, 0.831) and want to reach the modern building with large glass windows on the left bank of the river. Which direction should you move to get there?" }, { "from": "gpt", "value": "The blue water at lower left is represented by point (0.523, 0.831). To reach the modern building with large glass windows on the left bank of the river, you should move towards the left bank, which is the opposite direction of the right bank where the red brick structure is located." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/57241fc82305cab3.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.796, 0.750) farther from viewer compared to point (0.448, 0.306)?" }, { "from": "gpt", "value": "Yes, point (0.796, 0.750) is farther from viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c2ba85aa56d0e6d7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if glossy metallic mirror at center is shorter than blue fabric person at center?" }, { "from": "gpt", "value": "No, glossy metallic mirror at center is not shorter than blue fabric person at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/27970ea3ee11514a.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of blue cotton shirt at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.535, 0.458)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1acf7327cc2b4d69.jpg", "conversations": [ { "from": "human", "value": "\nBetween matte blue cap at left and blue fabric tank top at right, which one has less height?" }, { "from": "gpt", "value": "Standing shorter between the two is matte blue cap at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b05908ceac619768.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, green woven fabric at upper left or matte gray kimono at center?" }, { "from": "gpt", "value": "Standing shorter between the two is matte gray kimono at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/79ac7b296d54afc0.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a matte black face at upper left. Pinpoint a point to the matte black face at upper left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.476, 0.197)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4e3d1613460f44a0.jpg", "conversations": [ { "from": "human", "value": "\nIs white fluffy cat at center bigger than white fur paw at lower center?" }, { "from": "gpt", "value": "Indeed, white fluffy cat at center has a larger size compared to white fur paw at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c045133583781cb.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, green plastic toy at lower right or rubberized plastic toy car at center?" }, { "from": "gpt", "value": "rubberized plastic toy car at center is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/edfa826288e037f5.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.828, 0.752) lie behind point (0.729, 0.259)?" }, { "from": "gpt", "value": "No, (0.828, 0.752) is in front of (0.729, 0.259)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c767b185642504fd.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer analyzing the composition of this black and white photo. You notice two clothing items worn by the woman in the scene. The dark fabric skirt at center and the white soft sweater at center. Which clothing item is positioned lower on her body?" }, { "from": "gpt", "value": "The dark fabric skirt at center is below the white soft sweater at center, so the dark fabric skirt at center is positioned lower on her body." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b248fd47d3078c50.jpg", "conversations": [ { "from": "human", "value": "\nYou are a tourist at the floating market and want to buy fried rice. You see the purple fabric at center and the yellow fabric shirt at center. Which item is smaller in size?" }, { "from": "gpt", "value": "The purple fabric at center is smaller than the yellow fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/978941eb6acdbd27.jpg", "conversations": [ { "from": "human", "value": "\nYou are a dog trainer assessing the spacing between the black furry dog at left and the white fluffy dog at center on the couch. Based on the image, can you confirm if there is enough space to comfortably fit a third dog between them?" }, { "from": "gpt", "value": "The distance between the black furry dog at left and the white fluffy dog at center is 36.23 centimeters. Depending on the size of the third dog, this space may or may not be sufficient. For smaller breeds, it could be adequate, but larger dogs might require more room." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/11a51804a07eefb8.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green grassy at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.610, 0.856)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df4074510ddb8c64.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the beach and see the green translucent water at lower center and the green fabric shorts at lower right. Which object is closer to the left side of your view?" }, { "from": "gpt", "value": "The green translucent water at lower center is to the left of the green fabric shorts at lower right, so it is closer to the left side of your view." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4c84aca2dae67230.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in a forest clearing and see the natural wood cabin at center. If you want to walk towards the cabin, how many meters do you need to walk to reach it?" }, { "from": "gpt", "value": "The distance between you and the natural wood cabin at center is 10.51 meters, so you need to walk 10.51 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07082b5fef862157.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.568, 0.217) or point (0.609, 0.544)?" }, { "from": "gpt", "value": "Point (0.609, 0.544)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a966edd193f04c3.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of pink polka dot pajamas at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.438, 0.647)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2832614f6511bf53.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth water at boat right taller than thick green foliage at upper left?" }, { "from": "gpt", "value": "Incorrect, smooth water at boat right's height is not larger of thick green foliage at upper left's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9a2296bc7d59d663.jpg", "conversations": [ { "from": "human", "value": "\nDoes green matte water at center have a lesser height compared to green leafy trees at upper center?" }, { "from": "gpt", "value": "Indeed, green matte water at center has a lesser height compared to green leafy trees at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/adac7895226e46f6.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.341, 0.117) come behind point (0.847, 0.302)?" }, { "from": "gpt", "value": "Yes, point (0.341, 0.117) is behind point (0.847, 0.302)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c02b0600039750a3.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.462, 0.808) or (0.595, 0.447)?" }, { "from": "gpt", "value": "Point (0.595, 0.447)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f17ed7dafd0a41f.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.882, 0.000) farther from viewer compared to point (0.432, 0.997)?" }, { "from": "gpt", "value": "Yes, point (0.882, 0.000) is behind point (0.432, 0.997)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f2d37a08ca69a71b.jpg", "conversations": [ { "from": "human", "value": "\nWhere is white glossy balloon at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.603, 0.161)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4295a75c61f51f8a.jpg", "conversations": [ { "from": "human", "value": "\nHow far apart are smooth skin man at center and slightly tanned skin at upper center?" }, { "from": "gpt", "value": "smooth skin man at center is 4.60 centimeters away from slightly tanned skin at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c51a6016b502d77.jpg", "conversations": [ { "from": "human", "value": "\nLooking at the three people in the foreground of the nightclub scene, can you determine if the checkered fabric sweater at center is positioned to the left or right of the brownsmoothhair at center?" }, { "from": "gpt", "value": "The checkered fabric sweater at center is to the right of brownsmoothhair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/072a991c2ccee346.jpg", "conversations": [ { "from": "human", "value": "\nIs granite gray counter top at center positioned before wooden drawer at lower center?" }, { "from": "gpt", "value": "Yes, granite gray counter top at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d780699c4238b8f6.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and want to walk to the point marked as point (0.704, 0.373). How far is that location from where you are standing?" }, { "from": "gpt", "value": "The distance between the camera and point (0.704, 0.373) is 14.87 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/118d4bb3a6d3e52e.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.230, 0.589) less distant than point (0.208, 0.545)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1997449d47807ac8.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the navy blue shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.544, 0.636)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1269a5ae13890f16.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the floral fabric shirt at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.452, 0.641)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6574da3fb5cea372.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte gray jacket at center have a smaller size compared to brown matte sweatshirt at center?" }, { "from": "gpt", "value": "No, matte gray jacket at center is not smaller than brown matte sweatshirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0fbb1532f298e006.jpg", "conversations": [ { "from": "human", "value": "\nHow distant is matte nylon jacket at left from clear plastic goggles at upper center?" }, { "from": "gpt", "value": "The distance of matte nylon jacket at left from clear plastic goggles at upper center is 13.78 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7551efbb9befb6df.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.098, 0.530)?" }, { "from": "gpt", "value": "dark gray matte pigeon at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04b3145dcb20095f.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at upper left is positioned to the left of smooth concrete at center?" }, { "from": "gpt", "value": "Correct, you'll find green leafy tree at upper left to the left of smooth concrete at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4be739a32598e3c.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the back of the conference room. You need to take a photo of the wooden table at center and the silver metallic microphone at lower center. Which object should you focus on first if you want to capture both in a single shot without moving the camera?" }, { "from": "gpt", "value": "The wooden table at center has a lesser height compared to silver metallic microphone at lower center, so you should focus on the silver metallic microphone at lower center first to ensure both are in focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d59dcd54dc7f58c0.jpg", "conversations": [ { "from": "human", "value": "\nDoes yellow-green foliage at center have a larger size compared to brown bark tree at center?" }, { "from": "gpt", "value": "Indeed, yellow-green foliage at center has a larger size compared to brown bark tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/779679259a379a49.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position in the park scene. There is a specific point marked at coordinates point (0.736, 0.123). How far is that point from your current position?" }, { "from": "gpt", "value": "The point (0.736, 0.123) is 56.98 feet away from the camera position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/09974585082b46a6.jpg", "conversations": [ { "from": "human", "value": "\nHow close is satin black headphones at center from camera?" }, { "from": "gpt", "value": "They are 19.38 inches apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6994478b73a6f627.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the pastel striped sweater at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.679, 0.730)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed6187f5722dcd56.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.247, 0.666) come farther from viewer compared to point (0.676, 0.578)?" }, { "from": "gpt", "value": "No, (0.247, 0.666) is in front of (0.676, 0.578)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b2f3b5968e40f533.jpg", "conversations": [ { "from": "human", "value": "\nHow far is white matte wing at center from camera?" }, { "from": "gpt", "value": "white matte wing at center and camera are 36.35 inches apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc318f3cc288c413.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at center thinner than white fluffy cloud at left?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0778b17f5c3bcdd2.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.481, 0.900)?" }, { "from": "gpt", "value": "green grass at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c61276a08c20d3bf.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.453, 0.909) positioned behind point (0.057, 0.648)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9b741d2d9641d72.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is green matte suv at left from camera?" }, { "from": "gpt", "value": "The distance of green matte suv at left from camera is 17.24 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/034b7963ce9c9cdc.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, wooden stairs at center or wooden at center?" }, { "from": "gpt", "value": "wooden at center is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b737aa6629438de.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the left, yellow reflective vest at lower right or yellow reflective safety vest at lower right?" }, { "from": "gpt", "value": "yellow reflective safety vest at lower right is more to the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9e46de1677bba203.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue water at center have a lesser width compared to blue matte container ship at center?" }, { "from": "gpt", "value": "Indeed, blue water at center has a lesser width compared to blue matte container ship at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ad26be278dd0d957.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between point (0.218, 0.403) and camera?" }, { "from": "gpt", "value": "They are 1.30 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d73427fd4147e2e.jpg", "conversations": [ { "from": "human", "value": "\nBetween black satin dress at left and gray woolen pants at center, which one has more height?" }, { "from": "gpt", "value": "With more height is black satin dress at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/889ee9825764b159.jpg", "conversations": [ { "from": "human", "value": "\nHow close is brown wood table at center from camera?" }, { "from": "gpt", "value": "They are 30.26 inches apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06ef779d191d8dd2.jpg", "conversations": [ { "from": "human", "value": "\nYou are designing a display stand for a clothing store. The stand has two hangers. The first hanger can hold up to 1.2 kg, and the second can hold up to 1.5 kg. You need to hang the matte red vest at center and the printed cotton robe at left. Which item should go on which hanger to ensure safety?" }, { "from": "gpt", "value": "The matte red vest at center is larger in size than the printed cotton robe at left, so it likely weighs more. To ensure safety, place the matte red vest at center on the second hanger that can hold up to 1.5 kg and the printed cotton robe at left on the first hanger with 1.2 kg capacity." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/edc064d6af6d3710.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if polished brass clock tower at upper center is positioned above white brick clock at center?" }, { "from": "gpt", "value": "Correct, polished brass clock tower at upper center is located above white brick clock at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b041bef11130a88e.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.388, 0.223) positioned after point (0.144, 0.823)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ced62a7a803fa0c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue fabric beach ball at center is taller than earth-patterned fabric globe at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d4c8fe3b1f7440c6.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of matte straw hat at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.523, 0.656)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16a2d5cbc64d7387.jpg", "conversations": [ { "from": "human", "value": "\nYou are a tourist standing on the blue painted metal bridge at left, looking towards the dark blue water at center. Which object is closer to the water surface?" }, { "from": "gpt", "value": "The blue painted metal bridge at left is closer to the water surface than the dark blue water at center because the bridge is positioned over the water, while the water itself is at the lower part of the scene." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/889390c9e2e2cee1.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.425, 0.830) farther from camera compared to point (0.352, 0.713)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4a37a607f0463d7.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a green leafy at center. Pinpoint a point to the green leafy at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.371, 0.520)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49ed6abc43673714.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.142, 0.923) lie behind point (0.385, 0.548)?" }, { "from": "gpt", "value": "No, (0.142, 0.923) is in front of (0.385, 0.548)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7aed6e5fc600861.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.334, 0.695) in front of point (0.268, 0.327)?" }, { "from": "gpt", "value": "No, (0.334, 0.695) is further to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/add5f992fd9147d6.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of blue denim jacket at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.820, 0.700)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6336e2febad77b5e.jpg", "conversations": [ { "from": "human", "value": "\nBetween black plastic keyboard at center and skinny white hand at center, which one is positioned higher?" }, { "from": "gpt", "value": "Positioned higher is skinny white hand at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1791fc562bb49e9b.jpg", "conversations": [ { "from": "human", "value": "\nBetween gray concrete sidewalk at center and green plastic bench at lower right, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "From the viewer's perspective, gray concrete sidewalk at center appears more on the left side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/24730129286454de.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.972, 0.787) and camera?" }, { "from": "gpt", "value": "Point (0.972, 0.787) is 30.16 inches away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/74d98affcd29cd03.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any beige canvas tent at center in the image." }, { "from": "gpt", "value": "[(0.857, 0.388)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4e7d1889240a6165.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the shiny metallic ornaments at upper center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.365, 0.236)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/50a51c47c17f96e6.jpg", "conversations": [ { "from": "human", "value": "\nBetween maroon fabric kurta at center and patterned fabric sari at center, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "maroon fabric kurta at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d3fee6a51a42f228.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.520, 0.797) or point (0.933, 0.809)?" }, { "from": "gpt", "value": "Point (0.520, 0.797)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c9f7e98f07bc7d9.jpg", "conversations": [ { "from": "human", "value": "\nLocate black leather jacket at lower left in the image." }, { "from": "gpt", "value": "[(0.070, 0.805)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/31f0e024ec3b6da6.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the rustic porch and want to sit down. Where exactly is the weathered wood bench at left located?" }, { "from": "gpt", "value": "The weathered wood bench at left is located at point (0.338, 0.869)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73dcd7c82d240e3d.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of matte red minifigure at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.647, 0.352)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca8a07698bec2be8.jpg", "conversations": [ { "from": "human", "value": "\nBetween brown leather horse at center and white leather horse at left, which one is positioned higher?" }, { "from": "gpt", "value": "brown leather horse at center is higher up." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/12c9746dbb2fec46.jpg", "conversations": [ { "from": "human", "value": "\nYou are a city planner reviewing a satellite image of a neighborhood. You need to determine if the red tile roof at center is positioned within the central area of the image. Based on the coordinates provided, can you confirm its location?" }, { "from": "gpt", "value": "The red tile roof at center is located at point coordinates of (0.438, 0.914), which places it in the central area of the image as per the given coordinates." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d34bbf5a5f2c188.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from rusty metal table at lower center to camera." }, { "from": "gpt", "value": "rusty metal table at lower center is 2.22 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0007df6c7431789.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.235, 0.827) closer to viewer compared to point (0.300, 0.677)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dbae9c46cb22474b.jpg", "conversations": [ { "from": "human", "value": "\nIs rugged brown mountain at upper center positioned at the back of gravelly path at center?" }, { "from": "gpt", "value": "Yes, rugged brown mountain at upper center is behind gravelly path at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/40f4ef60914dabba.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of gray checkered shirt at lower left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.077, 0.739)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d419387c0cefdbfa.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.292, 0.716)?" }, { "from": "gpt", "value": "dark gray fabric at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4c5964fb7d441aa.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the weathered wood window at upper right? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.735, 0.473)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/89413f65c1cfdf34.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.430, 0.589) come closer to viewer compared to point (0.817, 0.617)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c082510d2a6d9223.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and want to know the distance to the point marked as point (0.012, 0.531). What is the distance in meters?" }, { "from": "gpt", "value": "The point (0.012, 0.531) is 8.43 meters away from the camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f35fbf81aa57f8ee.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, matte blue jacket at left or bronze statue at center?" }, { "from": "gpt", "value": "With less height is matte blue jacket at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f0e2b0e3757555d9.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of shiny metallic face at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.699, 0.575)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a39e66d608473e44.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between black matte swimsuit at center and camera?" }, { "from": "gpt", "value": "black matte swimsuit at center is 11.07 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/618d40ebc5d4d8e0.jpg", "conversations": [ { "from": "human", "value": "\nYou are a security guard at the event and need to check the distance between the matte black suit at center and the dark gray backpack at left. Can you confirm if the distance is less than 5 feet?" }, { "from": "gpt", "value": "The matte black suit at center is 4.53 feet from the dark gray backpack at left, so yes, the distance is less than 5 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/39a480ef92f598e8.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the shopping mall atrium and want to reach the point marked at coordinates (0.451, 0.873). How far is this point from your current position?" }, { "from": "gpt", "value": "The point marked at coordinates (0.451, 0.873) is 58.15 feet away from your current position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eba750fc6d6814ff.jpg", "conversations": [ { "from": "human", "value": "\nHow close is matte black table at center from striped cotton shirt at center?" }, { "from": "gpt", "value": "27.38 inches" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e51e2349dfc66c50.jpg", "conversations": [ { "from": "human", "value": "\nHow far is rusty metal balcony at center from camera?" }, { "from": "gpt", "value": "rusty metal balcony at center is 37.23 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb7dc16166e88027.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.394, 0.552) in front of point (0.547, 0.384)?" }, { "from": "gpt", "value": "Yes, point (0.394, 0.552) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d69b10a40df3d947.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker planning to take a photo of the snowy granite mountains at upper center and the matte green jacket at center. Which object should you focus on first if you want both to be in sharp focus?" }, { "from": "gpt", "value": "The snowy granite mountains at upper center are much taller than the matte green jacket at center, so you should focus on the snowy granite mountains at upper center first to ensure both are in sharp focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01b026c3c6c63b19.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing on the pathway in the scene. You want to take a photo of the floral dress at left and the green grass at lower center. Which object is positioned lower in the frame?" }, { "from": "gpt", "value": "The green grass at lower center is positioned lower than the floral dress at left in the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b3c6da7febe3eb26.jpg", "conversations": [ { "from": "human", "value": "\nDoes red fleece jacket at right have a greater height compared to white paper at upper left?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cbfd41d5ba41a891.jpg", "conversations": [ { "from": "human", "value": "\nHow close is point (0.243, 0.588) from camera?" }, { "from": "gpt", "value": "Point (0.243, 0.588) is 14.74 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3e51e99d3efcb4ff.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any yellow-green foliage at center in the image." }, { "from": "gpt", "value": "[(0.270, 0.716)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec36c970692be054.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a pink cotton shirt at lower right. Pinpoint a point to the pink cotton shirt at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.873, 0.630)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a25cd29162096033.jpg", "conversations": [ { "from": "human", "value": "\nYou are setting up a new computer and need to connect the black plastic plug at upper right to the black plastic monitor at upper left. The cable you have is 45 centimeters long. Will the cable be long enough to reach?" }, { "from": "gpt", "value": "The distance between the black plastic monitor at upper left and the black plastic plug at upper right is 47.43 centimeters. Since the cable is only 45 centimeters long, it is shorter than the required distance. Therefore, the cable will not be long enough to reach." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/30b45c610f7a0dd8.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.320, 0.936) and camera?" }, { "from": "gpt", "value": "Point (0.320, 0.936) is 19.38 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c42c19f3d13bc4ea.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if floral cotton shirt at center is positioned above green rubber rope at center?" }, { "from": "gpt", "value": "Yes, floral cotton shirt at center is above green rubber rope at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7748c1a9a7168bc5.jpg", "conversations": [ { "from": "human", "value": "\nDoes white paper basket at center appear on the left side of yellowish matte chicken at center?" }, { "from": "gpt", "value": "Yes, white paper basket at center is to the left of yellowish matte chicken at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/68fe9b0d72223308.jpg", "conversations": [ { "from": "human", "value": "\nYou are a crane operator at the port and need to load cargo from the brown wooden dock at lower left onto the white matte ship at center. The crane has a maximum reach of 50 feet. Can the crane safely reach the ship from the dock?" }, { "from": "gpt", "value": "The white matte ship at center is 53.36 feet away from the brown wooden dock at lower left. Since the crane can only reach 50 feet, it cannot safely reach the ship from the dock." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4850219a19c85795.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of transparent water at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.496, 0.852)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1fa0ff1cd4138c1.jpg", "conversations": [ { "from": "human", "value": "\nYou are a park visitor who wants to sit on a bench that is closer to the shaded area provided by the trees. Which bench should you choose between the dark brown wooden bench at lower right and the wooden bench at lower left?" }, { "from": "gpt", "value": "The dark brown wooden bench at lower right is located above the wooden bench at lower left. Since the shaded area is on the left side with the tall trees, the wooden bench at lower left is closer to the shaded area provided by the trees." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/705eaf8141f575ef.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery driver who needs to ensure your white matte truck at center can pass under the white metal railing at upper center without hitting it. Based on the scene, can you safely drive the truck under the railing?" }, { "from": "gpt", "value": "The white metal railing at upper center is smaller than the white matte truck at center, so the truck can safely pass under the railing without hitting it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07e79e0ea534d99c.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of Maker s Mark Distillery and want to take a photo of the point at coordinates (0.331, 0.939). If your camera has a focal length of 50mm and you are 6.32 meters away from the point, will the point be in focus if the depth of field extends from 5 meters to 7 meters?" }, { "from": "gpt", "value": "The point at coordinates (0.331, 0.939) is 6.32 meters away from the camera. Since the depth of field extends from 5 meters to 7 meters, the point will be within the depth of field and thus in focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/72db5eaf83b6f7d6.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of clear blue water at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.517, 0.753)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/af3719e83f68da13.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.204, 0.395) and point (0.517, 0.023), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.517, 0.023) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fab06fd8e7d3b8e7.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the street scene and want to pick up the dark blue fabric at center. How far do you need to walk to reach it?" }, { "from": "gpt", "value": "The dark blue fabric at center is 4.86 meters from the viewer, so you need to walk 4.86 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/003e7a67277201e9.jpg", "conversations": [ { "from": "human", "value": "\nYou are a poultry judge at an exhibition. You need to determine the distance between the white fluffy rooster at center and the black glossy rooster at center. What is the distance between them?" }, { "from": "gpt", "value": "The distance between the white fluffy rooster at center and the black glossy rooster at center is 24.70 inches." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/909d803be58b48b8.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the red fabric flag at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.040, 0.537)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c1efb4919609c2a7.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of dark blue t-shirt at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.386, 0.294)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5a481c2d8871ebf.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the right, reddish-brown stone archway at center or dirt path at center?" }, { "from": "gpt", "value": "Positioned to the right is reddish-brown stone archway at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df4449036bcd9a9b.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.310, 0.861) or point (0.372, 0.759)?" }, { "from": "gpt", "value": "Point (0.310, 0.861) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/906e02123c5718f8.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black suit at center bigger than dark gray hoodie at right?" }, { "from": "gpt", "value": "Incorrect, matte black suit at center is not larger than dark gray hoodie at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/257c67cf47efb6d8.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte helmet at center appear under shiny metallic skis at left?" }, { "from": "gpt", "value": "Correct, white matte helmet at center is located below shiny metallic skis at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/460efbbf20ee26ef.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.725, 0.178) in front of point (0.915, 0.122)?" }, { "from": "gpt", "value": "Yes, point (0.725, 0.178) is in front of point (0.915, 0.122)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d81dd9b5c2bdfb3.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.637, 0.216) and point (0.389, 0.331), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.637, 0.216) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d7e33655796e87bd.jpg", "conversations": [ { "from": "human", "value": "\nYou are a referee standing at the point where the image was taken. You need to measure the distance between yourself and the point marked as point (0.533, 0.777). What is the distance?" }, { "from": "gpt", "value": "The distance between the viewer and point (0.533, 0.777) is 5.93 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d81fd4fa923665a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte orange jersey at center is positioned to the right of white plastic goal post at right?" }, { "from": "gpt", "value": "In fact, matte orange jersey at center is to the left of white plastic goal post at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/369b94187b3f734c.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.299, 0.100) come behind point (0.540, 0.227)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/027052c01187f49e.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue shirt at left appear on the left side of pink matte shirt at center?" }, { "from": "gpt", "value": "Correct, you'll find blue shirt at left to the left of pink matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c8c243c559d6a700.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a closeup of the two people in the scene. You notice both the matte black sunglasses at center and the matte black sunglasses at upper center. Which pair of sunglasses is positioned higher up in the image?" }, { "from": "gpt", "value": "The matte black sunglasses at upper center is positioned higher up in the image than the matte black sunglasses at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/314c751002da1a54.jpg", "conversations": [ { "from": "human", "value": "\nLocate the blue water at center in the image." }, { "from": "gpt", "value": "[(0.514, 0.841)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c3e3616204b68484.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.440, 0.580) lie behind point (0.899, 0.791)?" }, { "from": "gpt", "value": "No, (0.440, 0.580) is in front of (0.899, 0.791)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60210de4c1a50108.jpg", "conversations": [ { "from": "human", "value": "\nBetween matte black snowboarder at upper center and black plastic goggles at upper left, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "black plastic goggles at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ab373dfc9b889a1.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.538, 0.692) or (0.679, 0.219)?" }, { "from": "gpt", "value": "Point (0.679, 0.219)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b266eefaa296cbb.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person trying to deliver a package to the MacBook laptop. The package is too large to fit through the door. You need to place it precisely on the point at coordinates point (0.074, 0.111). If you are standing at the MacBook laptop, how far do you need to move the package to reach that point?" }, { "from": "gpt", "value": "The distance between the MacBook laptop and the point (0.074, 0.111) is 3.53 feet. Therefore, you need to move the package 3.53 feet to reach the specified point." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03cac400ee2ce372.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.468, 0.711)?" }, { "from": "gpt", "value": "natural stone patio at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d2e3ec3cbef6895a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if stone wall at center is smaller than polished brass lamp post at center?" }, { "from": "gpt", "value": "No, stone wall at center is not smaller than polished brass lamp post at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec4887240ace195e.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.013, 0.264) from camera?" }, { "from": "gpt", "value": "Point (0.013, 0.264) and camera are 4.50 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f365a3bd2e80b3ad.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the base of the ski slope and see the orange fabric ski suit at center. How far away is it from you?" }, { "from": "gpt", "value": "The orange fabric ski suit at center is 30.01 meters away from the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00342dbcfa931395.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, matte black vest at center or red plaid kilt at center?" }, { "from": "gpt", "value": "Positioned higher is matte black vest at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/47598331d8a40141.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark blue t-shirt at center lie behind white cotton shirt at center?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f972fa7af6259d93.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.720, 0.573)?" }, { "from": "gpt", "value": "black glossy laptop at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/057e0a7bdbc1bad0.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.538, 0.637)?" }, { "from": "gpt", "value": "pink striped jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4317b8d695fdceb6.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of smooth concrete pavement at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.529, 0.739)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f90b560767525e6c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green grass at lower center is positioned to the right of gray fabric tent at lower center?" }, { "from": "gpt", "value": "No, green grass at lower center is not to the right of gray fabric tent at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fbf99f085e488c60.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked by the coordinates point (0.488, 0.919) in the image. What is the color of the ground under your feet?" }, { "from": "gpt", "value": "The point (0.488, 0.919) marks green grass at lower center, so the ground under your feet is green grass." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5bb1862dd2b1f19f.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a black suit at center. Pinpoint a point to the black suit at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.750, 0.700)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/25d738bd7d948662.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of earthenware bowl at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.692, 0.805)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/646e6c32fd996025.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of matte paper poster at right? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.882, 0.511)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4e097c0a8fdf1ee3.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, smooth gray roof at center or green leafy hillside at left?" }, { "from": "gpt", "value": "Positioned to the left is green leafy hillside at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9561d1cbf5783143.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green grass at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.492, 0.802)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/085c15401f705ebb.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.128, 0.097)?" }, { "from": "gpt", "value": "black cotton hoodie at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7cfb707ffd97606a.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.886, 0.394) from camera?" }, { "from": "gpt", "value": "Point (0.886, 0.394) is 20.29 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70bd728e9e8d52dc.jpg", "conversations": [ { "from": "human", "value": "\nLocate white concrete western auto at center in the image." }, { "from": "gpt", "value": "[(0.730, 0.550)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ec0c982ae15b72b.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.521, 0.544) behind point (0.082, 0.392)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/21dc9c49d147a3f3.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of black matte table at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.556, 0.875)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5182d2cc74728ca2.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the vibrant orange petals at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.295, 0.470)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/521857a8835e33d5.jpg", "conversations": [ { "from": "human", "value": "\nLocate white fabric sail at upper right in the image." }, { "from": "gpt", "value": "[(0.828, 0.634)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9464927ad47afa9d.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the matte black helicopter at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.247, 0.408)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ade64aa9ae1520ad.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of metallic gray chair at lower left in the image." }, { "from": "gpt", "value": "[(0.036, 0.908)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7afc9f598fe01f6b.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny metallic train at upper right below yellow plastic track at bottom left?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4734e21e07dc7ef0.jpg", "conversations": [ { "from": "human", "value": "\nIs white fabric sandals at upper center behind white cotton pants at upper center?" }, { "from": "gpt", "value": "No, it is in front of white cotton pants at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5ff2ee1774a35d57.jpg", "conversations": [ { "from": "human", "value": "\nPoint to rustic stone mountain at upper left.Point to the rustic stone mountain at upper left in the image." }, { "from": "gpt", "value": "[(0.518, 0.123)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f2d4e505f41cf6ac.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, matte purple shirt at upper center or matte skin hand at upper center?" }, { "from": "gpt", "value": "matte purple shirt at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/018a84122a882fd5.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at upper center is shorter than brown rock stream at center?" }, { "from": "gpt", "value": "Incorrect, green leafy tree at upper center's height does not fall short of brown rock stream at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b67727aed0a82e6.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.872, 0.014) and camera?" }, { "from": "gpt", "value": "The distance of point (0.872, 0.014) from camera is 3.37 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d828aec103c24fc.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from green cotton shirt at lower right to brown leather jacket at lower left." }, { "from": "gpt", "value": "26.15 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85c09bd944e49c62.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the front porch of the house and want to place the light brown wooden chair at center in front of the white louvered shutter at center. Is there enough space for the chair to fit without overlapping the shutter?" }, { "from": "gpt", "value": "The white louvered shutter at center might be wider than the light brown wooden chair at center, so there might be enough space for the chair to fit without overlapping the shutter, but it depends on the exact dimensions." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fae05568e4323be7.jpg", "conversations": [ { "from": "human", "value": "\nBetween straw hat at center and dark blue jeans at left, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "Positioned to the right is straw hat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d34a651525c956f4.jpg", "conversations": [ { "from": "human", "value": "\nIs black fabric banner at center to the left of white plastic pole at upper right from the viewer's perspective?" }, { "from": "gpt", "value": "Yes, black fabric banner at center is to the left of white plastic pole at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/841c08e82aa6c97b.jpg", "conversations": [ { "from": "human", "value": "\nWhere is smooth skin girl at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.362, 0.566)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6bba806e9ee3f78b.jpg", "conversations": [ { "from": "human", "value": "\nYou are a military observer assessing the boarding operation. You notice the blue hard hat at center and the matte black rifle at center. Which object is positioned lower in the scene?" }, { "from": "gpt", "value": "The blue hard hat at center is located below the matte black rifle at center, so it is positioned lower in the scene." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/38e38385409deeea.jpg", "conversations": [ { "from": "human", "value": "\nLocate shiny green apples at center in the image." }, { "from": "gpt", "value": "[(0.500, 0.509)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e7c1ac06c3c2330f.jpg", "conversations": [ { "from": "human", "value": "\nIs green cotton t-shirt at center smaller than fuzzy fabric couch at lower left?" }, { "from": "gpt", "value": "No, green cotton t-shirt at center is not smaller than fuzzy fabric couch at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe176e6b9e07d0dd.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at right have a smaller size compared to green leafy tree at center?" }, { "from": "gpt", "value": "Correct, green leafy tree at right occupies less space than green leafy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c64f297d3aa56348.jpg", "conversations": [ { "from": "human", "value": "\nLocate the silver metallic wing at upper center in the image." }, { "from": "gpt", "value": "[(0.329, 0.417)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a9e3b3aab6281dce.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the distance between transparent glass building at center and matte white van at lower left?" }, { "from": "gpt", "value": "A distance of 113.80 meters exists between transparent glass building at center and matte white van at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0113f75bf5fb3e3a.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of glossy maroon car at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.104, 0.467)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/65f176a5c9a9bc6c.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny blue skirt at center bigger than fringed blue fabric skirt at center?" }, { "from": "gpt", "value": "Yes, shiny blue skirt at center is bigger than fringed blue fabric skirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6418b7d1a5d3ea9d.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of pink fabric shirt at lower left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.151, 0.866)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6144551712fa2af0.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.774, 0.353) and point (0.397, 0.933), which one is positioned behind?" }, { "from": "gpt", "value": "Point (0.397, 0.933)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fbb1a1046734bab9.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blonde hair at lower center is thinner than dark brown leather jacket at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cb185333e1d6dc9a.jpg", "conversations": [ { "from": "human", "value": "\nYou are a guest at this pool party and want to take a photo of the smooth skin man at center without including the green leafy hedge at upper center in the frame. How should you adjust your camera angle?" }, { "from": "gpt", "value": "To exclude the green leafy hedge at upper center from the photo, lower your camera angle so that the hedge is out of view while keeping the smooth skin man at center in the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/32bac89353e0678e.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.459, 0.453) and point (0.782, 0.548), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.782, 0.548)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d43d02d4abc85377.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the rustic kitchen and want to place a small plant between the two points, point (0.266, 0.241) and point (0.662, 0.255). Can you determine which point is closer to you so you can place the plant in front of it?" }, { "from": "gpt", "value": "Point (0.266, 0.241) is in front of point (0.662, 0.255), so you should place the plant in front of point (0.266, 0.241)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c2360e8e989cf748.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up for a portrait in this scene. You need to ensure that the white lace dress at left and the smooth beige suit at center are both visible in the frame. Given their height difference, which object should you adjust the camera angle to focus on to capture both effectively?" }, { "from": "gpt", "value": "The white lace dress at left is shorter than the smooth beige suit at center. To capture both effectively, lower the camera angle slightly to ensure the shorter white lace dress at left is fully visible while still including the taller smooth beige suit at center in the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd33e52c90979bd4.jpg", "conversations": [ { "from": "human", "value": "\nYou are a tour guide leading a group to the fuel shed located near the center. You see the white matte boat at lower right and the green matte boat at center. Can you tell the group the distance between these two boats?" }, { "from": "gpt", "value": "The distance between the white matte boat at lower right and the green matte boat at center is 18.48 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/641a97336e53b644.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the concert and want to capture a photo of the black silhouettes at lower center. The stage is divided into sections with coordinates. The point where you need to focus is at point (0.487, 0.880). Can you confirm if the black silhouettes at lower center is located at that coordinate?" }, { "from": "gpt", "value": "Yes, the black silhouettes at lower center is located at point (0.487, 0.880), so you can focus there to capture the photo." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/61952456648f0295.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white matte t-shirt at center is shorter than clear glass at right?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7c75b7a069b9732.jpg", "conversations": [ { "from": "human", "value": "\nBetween yellow/blue athletic uniform at center and blue jersey at center, which one has less height?" }, { "from": "gpt", "value": "With less height is blue jersey at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86dc3efef8f2eb06.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the shiny black suv at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.219, 0.842)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/078a02451649f8ce.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a brown leather jacket at upper center. Pinpoint a point to the brown leather jacket at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.458, 0.392)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7db0dbf459b07dc.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.331, 0.802) from camera?" }, { "from": "gpt", "value": "Point (0.331, 0.802) and camera are 57.25 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5158200d5157eba.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.245, 0.783) behind point (0.128, 0.141)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d40f63c26d1764c.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up a shot of the workspace. You want to focus on the satin white computer at center. Where should you position your camera relative to the point marked at coordinates (0.628, 0.188)?" }, { "from": "gpt", "value": "The point at coordinates (0.628, 0.188) marks the location of the satin white computer at center, so you should position your camera directly facing this point to focus on it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a292e64de83c310.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark suit at right is bigger than dark fabric dress at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cb49b636795a83db.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte bread at center have a greater height compared to golden brown bread at center?" }, { "from": "gpt", "value": "No, white matte bread at center is not taller than golden brown bread at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef71807be0d420f0.jpg", "conversations": [ { "from": "human", "value": "\nDescribe the object at (0.824, 0.433)." }, { "from": "gpt", "value": "rugged stone mountain at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3f2d08ca73fe8d76.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at a point 50.90 meters away from the historic stone church. If you look directly at the point labeled point (0.339, 0.470), which part of the church would you be focusing on?" }, { "from": "gpt", "value": "The point labeled point (0.339, 0.470) is located at the central entrance of the historic stone church, so you would be focusing on the central entrance." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7cfff4b1b610355.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray concrete pillar at center appear over smooth concrete pillar at center?" }, { "from": "gpt", "value": "Yes, gray concrete pillar at center is above smooth concrete pillar at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a487a9c11aba0f00.jpg", "conversations": [ { "from": "human", "value": "\nYou are a pedestrian walking on the sidewalk and see the dark brown leather jacket at center and the black rubber scooter at center. Which object is nearer to you?" }, { "from": "gpt", "value": "The dark brown leather jacket at center is closer to the viewer than the black rubber scooter at center, so the dark brown leather jacket at center is nearer to you." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2bf27491153d2421.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown dirt path at center appear on the left side of matte black backpack at center?" }, { "from": "gpt", "value": "No, brown dirt path at center is not to the left of matte black backpack at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8926a28cdde6f074.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of black matte suit at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.789, 0.473)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a7b2b2d6105a7ff.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of white floral bouquet at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.697, 0.419)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9206746906eaef8.jpg", "conversations": [ { "from": "human", "value": "\nDoes translucent pinkish-purple figure at center have a greater width compared to green leafy palm tree at left?" }, { "from": "gpt", "value": "Correct, the width of translucent pinkish-purple figure at center exceeds that of green leafy palm tree at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4471bb27cebb64f8.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.904, 0.328) and point (0.212, 0.505), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.212, 0.505) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/11ae4d5843de7a5f.jpg", "conversations": [ { "from": "human", "value": "\nDoes black rubber view mirror at upper right have a lesser height compared to shiny blue sedan at center?" }, { "from": "gpt", "value": "No, black rubber view mirror at upper right is not shorter than shiny blue sedan at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7293b83ab9463eeb.jpg", "conversations": [ { "from": "human", "value": "\nBetween black glass bottles at upper right and clear plastic bottle at center, which one is positioned lower?" }, { "from": "gpt", "value": "clear plastic bottle at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/361fdcb033a0afb5.jpg", "conversations": [ { "from": "human", "value": "\nYou are at a social event and want to approach the dark blue suit at right and the white textured shirt at center. Based on their positions, which one would you need to walk around first to reach both?" }, { "from": "gpt", "value": "The dark blue suit at right is below the white textured shirt at center, so you would need to approach the white textured shirt at center first before reaching the dark blue suit at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc9ad5b8c5721c23.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.249, 0.809) or (0.891, 0.364)?" }, { "from": "gpt", "value": "Point (0.249, 0.809) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ebb0d9d4071061e.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked as point (0.727, 0.703) in the gallery. You want to walk to the sculpture displayed on the dark pedestal. How far do you need to walk?" }, { "from": "gpt", "value": "You need to walk 4.40 meters to reach the sculpture displayed on the dark pedestal from the point marked as point (0.727, 0.703)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/28cff63b4baf0288.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if strawhat at center is thinner than multicolored woven sombrero at left?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c170173c547d6b16.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if purple matte flowers at upper right is positioned to the right of green mossy stone path at center?" }, { "from": "gpt", "value": "Indeed, purple matte flowers at upper right is positioned on the right side of green mossy stone path at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e5245f56cd6fb047.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from point (0.577, 0.566) to camera." }, { "from": "gpt", "value": "A distance of 17.22 inches exists between point (0.577, 0.566) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d4c2aff7229f6e84.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, black matte iphone box at center or matte black iphone at center?" }, { "from": "gpt", "value": "matte black iphone at center is below." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fcbd5c7940e11b14.jpg", "conversations": [ { "from": "human", "value": "\nIs brown textured root at center to the right of green grass at center from the viewer's perspective?" }, { "from": "gpt", "value": "No, brown textured root at center is not to the right of green grass at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/69c352134527bb71.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.490, 0.463) or point (0.353, 0.667)?" }, { "from": "gpt", "value": "The point (0.353, 0.667) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5ccb2640aac84c9d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray gravel at center is positioned above white cotton robe at right?" }, { "from": "gpt", "value": "Incorrect, gray gravel at center is not positioned above white cotton robe at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c89f84da37995942.jpg", "conversations": [ { "from": "human", "value": "\nYou are a security guard at the historic building and need to fit both the dark brown leather jacket at center and the dark brown leather coat at center into a storage locker that is 1 meter wide. Based on their widths, can both items fit side by side?" }, { "from": "gpt", "value": "The dark brown leather jacket at center might be wider than the dark brown leather coat at center. Since the locker is 1 meter wide, it is uncertain if both can fit without overlapping. Check their exact widths before storing." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f54ba54093aec573.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of matte white blouse at center in the image." }, { "from": "gpt", "value": "[(0.674, 0.652)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/faac443558a10595.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.935, 0.645) closer to viewer compared to point (0.298, 0.705)?" }, { "from": "gpt", "value": "No, it is behind (0.298, 0.705)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fd6b0d65f26fdcda.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the black matte jacket at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.072, 0.559)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a6f774f1e5541905.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the mosaic glass table at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.446, 0.655)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0813c5f9be81380.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked as point (0.159, 0.920) and want to take a photo of the group of four individuals in the scene. The camera you are using has a focal length of 50mm and a sensor size of 24mm x 36mm. What is the minimum distance you need to move forward or backward to ensure the entire group fits within the camera frame?" }, { "from": "gpt", "value": "To determine the minimum distance required, first calculate the camera sensor dimensions in terms of field of view. With a 50mm focal length and 24mm height sensor, the vertical field of view is approximately 27 degrees. The height of the group in the scene isn" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7830aaf2e202186.jpg", "conversations": [ { "from": "human", "value": "\nIs white woolen goat at center wider than brown fur dog at upper left?" }, { "from": "gpt", "value": "Yes, white woolen goat at center is wider than brown fur dog at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46f945e8f19c17f3.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the building and want to locate the point at coordinates (0.683, 0.094). Based on the scene description, which object is this point located on?" }, { "from": "gpt", "value": "The point at coordinates (0.683, 0.094) is located on the clear glass window at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/19208a6e148780c9.jpg", "conversations": [ { "from": "human", "value": "\nYou are at a party and need to decide which shirt to wear. You want something that is not too bulky. Based on the image, which of the following would be a better choice between the brown plaid shirt at right and the pink checkered shirt at center?" }, { "from": "gpt", "value": "The brown plaid shirt at right is thinner than the pink checkered shirt at center, so it would be a better choice if you want something less bulky." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c2059201e36bf7d0.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the orange cotton turban at left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.114, 0.536)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b31e77baabc3f858.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the metallic silver fence at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.412, 0.275)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d62a7052fd45a4e.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the green fuzzy tree at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.564, 0.825)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b3180a3ecf232619.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between natural wood fence at center and camera?" }, { "from": "gpt", "value": "They are 8.22 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60d5f2b9283ed593.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.835, 0.475) positioned in front of point (0.846, 0.394)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.846, 0.394)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/54b894dcad068ad8.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of matte black top hat at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.241, 0.598)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a045bf0185c43892.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of matte red shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.681, 0.650)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/acb0e04f3275a796.jpg", "conversations": [ { "from": "human", "value": "\nLocate all brown wood log at center in the image." }, { "from": "gpt", "value": "[(0.603, 0.158)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d8a7c91efdafd58.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the maroon jacket at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.552, 0.570)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c75524cb754e767a.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from point (0.096, 0.620) to camera." }, { "from": "gpt", "value": "3.85 feet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cfa951df2a4ae775.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of the point labeled with coordinates (0.452, 0.656) in the image?" }, { "from": "gpt", "value": "The point labeled with coordinates (0.452, 0.656) is located on the snowy rock mountain at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/10e090b3b0a90c7d.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.545, 0.655)?" }, { "from": "gpt", "value": "beige quilted bed at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/83c41864abb788a9.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the green leafy trees at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.504, 0.656)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ab4300a34bff380.jpg", "conversations": [ { "from": "human", "value": "\nWhat is located at the point with coordinates (0.499, 0.584) in the image?" }, { "from": "gpt", "value": "The point at (0.499, 0.584) is where the plaid fabric toddler at center is located." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf5fd93b1c752ba8.jpg", "conversations": [ { "from": "human", "value": "\nWhere is white concrete pavement at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.218, 0.847)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0bbaa0ca9a6dc22b.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of smooth black paper at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.556, 0.955)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8c162d69f054bb7.jpg", "conversations": [ { "from": "human", "value": "\nIs translucent amber block at center bigger than matte black chocolate bar at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/779f2317d7b56d22.jpg", "conversations": [ { "from": "human", "value": "\nDoes black matte shorts at center have a greater height compared to black fabric squat at lower left?" }, { "from": "gpt", "value": "Yes, black matte shorts at center is taller than black fabric squat at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0c3e029054b5dd6.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of green grass at lower center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.476, 0.881)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2232dceb87a40e9f.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow fabric shirt at lower left to the right of matte red shirt at lower left from the viewer's perspective?" }, { "from": "gpt", "value": "Correct, you'll find yellow fabric shirt at lower left to the right of matte red shirt at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b789473173caa7c0.jpg", "conversations": [ { "from": "human", "value": "\nHow far is white zip-up hoodie at upper center from white smooth arm at upper right?" }, { "from": "gpt", "value": "white zip-up hoodie at upper center and white smooth arm at upper right are 30.96 inches apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5448980ab4ba8f5e.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.381, 0.900) or (0.348, 0.855)?" }, { "from": "gpt", "value": "Point (0.381, 0.900) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/25f5cc3dbe6470b6.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of black glass door at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.677, 0.675)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dfed793d41745fb3.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at upper right is shorter than green leafy branch at upper left?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58fc70c2a706d4eb.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the left, gray soft shirt at center or black checkered flag at left?" }, { "from": "gpt", "value": "Positioned to the left is black checkered flag at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d9314f79fbcbbd7.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the base of the white stone bell tower at upper center and want to see over the black wrought iron railing at center to view the plaques behind. Can you see over the railing?" }, { "from": "gpt", "value": "The black wrought iron railing at center is shorter than the white stone bell tower at upper center, so yes, you can see over the black wrought iron railing at center from the base of the white stone bell tower at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b69c2ebc1954d83.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.788, 0.991) farther from camera compared to point (0.701, 0.600)?" }, { "from": "gpt", "value": "No, (0.788, 0.991) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4af6a299c1ee0b1f.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.080, 0.819) from camera?" }, { "from": "gpt", "value": "A distance of 36.91 inches exists between point (0.080, 0.819) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/acaadc18a6e7154a.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the black matte curtain at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.864, 0.423)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/214161d43b010649.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark gray rocky mountain range at center have a greater width compared to white matte moon at center?" }, { "from": "gpt", "value": "Correct, the width of dark gray rocky mountain range at center exceeds that of white matte moon at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/99a82fb077637ee6.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.416, 0.458) or point (0.435, 0.553)?" }, { "from": "gpt", "value": "Positioned in front is point (0.416, 0.458)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/468bb2f4567ab2f3.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the silhouette leafy tree at lower center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.388, 0.891)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/da8d60b966e155d6.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the yellow and white striped wall with a gate. There is a point at coordinates (0.542, 0.830) in the scene. If you want to reach that point, how far do you need to walk?" }, { "from": "gpt", "value": "The distance of point (0.542, 0.830) from the camera is 6.43 meters, so you need to walk 6.43 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3255ec8275b2afe1.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker carrying a red woven basket at center and a smooth gray rock at center. You need to place them in order from left to right. Which object should be placed first?" }, { "from": "gpt", "value": "The smooth gray rock at center should be placed first because the red woven basket at center is positioned on the right side of it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36b42610f4e93ddd.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.445, 0.942) farther from viewer compared to point (0.683, 0.233)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f3c492baa9f4257f.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and see the smooth red robe at right. If you want to reach out and touch it, will your hand be able to reach it without moving your body?" }, { "from": "gpt", "value": "The smooth red robe at right is 28.95 inches away from the camera, so yes, your hand can reach it without moving your body since the average human arm length is about 27 inches, but considering the robe is slightly further, you might need to stretch a bit. However, since it is within arm reach, it is possible." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/68c134d13590fa52.jpg", "conversations": [ { "from": "human", "value": "\nIs glossy plastic computer screen at upper center above white plastic keyboard at center?" }, { "from": "gpt", "value": "Indeed, glossy plastic computer screen at upper center is positioned over white plastic keyboard at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1c0f43119466e9c.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.585, 0.692) or (0.675, 0.623)?" }, { "from": "gpt", "value": "Point (0.585, 0.692)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0fc3b47eeae9f728.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked as point (0.018, 0.870) on the map. You want to take a photo of the coastal landscape. How far do you need to walk to reach the camera position to capture the scene?" }, { "from": "gpt", "value": "You need to walk 6.30 meters from point (0.018, 0.870) to reach the camera position to capture the coastal landscape." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/086ea7437cc43e4c.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the glossy black car at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.498, 0.881)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fd058e52fe5204e2.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.770, 0.630) and point (0.577, 0.303), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.770, 0.630)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/337645240cb99f26.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the white smooth lab coat at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.319, 0.594)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58cdea9e63e3b605.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between point (0.574, 0.359) and camera." }, { "from": "gpt", "value": "Point (0.574, 0.359) and camera are 13.09 feet apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/277342af5fb4361b.jpg", "conversations": [ { "from": "human", "value": "\nLocate grassy textured patch at center in the image." }, { "from": "gpt", "value": "[(0.280, 0.659)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f0727a2ef99fb93.jpg", "conversations": [ { "from": "human", "value": "\nYou are an architect evaluating the structural integrity of the building. You notice the dark glass window at upper center and the wooden window at center. Which window has a smaller width?" }, { "from": "gpt", "value": "The dark glass window at upper center has a lesser width compared to the wooden window at center, so the dark glass window at upper center is smaller in width." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0f3b140df4e6d93.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.344, 0.305) positioned behind point (0.744, 0.003)?" }, { "from": "gpt", "value": "No, (0.344, 0.305) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d277c9d92656c842.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between point (0.926, 0.155) and camera?" }, { "from": "gpt", "value": "Point (0.926, 0.155) is 172.64 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f0053297fc71ddfa.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.589, 0.942) or point (0.999, 0.922)?" }, { "from": "gpt", "value": "Positioned behind is point (0.589, 0.942)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b94fff7025cac192.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the green glass traffic light at lower left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.155, 0.720)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c3eec3d415466ff3.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the green leafy plant at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.675, 0.117)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4b03f9677105766.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a clear shot of both the green waterproof jacket at center and the blue reflective goggles at center. Since you want to ensure both are in focus, you need to know which object is wider. Can you tell me which one is wider?" }, { "from": "gpt", "value": "The green waterproof jacket at center is wider than the blue reflective goggles at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0887608b7af53626.jpg", "conversations": [ { "from": "human", "value": "\nYou are a gardener who needs to water the green grass at center and the white matte dog at center. Your watering can holds enough water for 5 meters of travel. Can you water both without refilling?" }, { "from": "gpt", "value": "The green grass at center and white matte dog at center are 7.62 meters apart from each other. Since the watering can only allows for 5 meters of travel, you cannot water both without refilling." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/22a748887535323f.jpg", "conversations": [ { "from": "human", "value": "\nLocate all multicolored costumes at center in the image." }, { "from": "gpt", "value": "[(0.876, 0.778)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e59d61cd4beb5c03.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, yellow matte shirt at lower left or denim jacket at center?" }, { "from": "gpt", "value": "denim jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58460225071356ae.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of matte black coat at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.732, 0.466)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/66fa33bfa940c8ff.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture both the shiny black umbrella at lower center and the matte pink umbrella at center in a single shot. Based on their positions, which umbrella will appear larger in the photo?" }, { "from": "gpt", "value": "The shiny black umbrella at lower center will appear larger in the photo because it is closer to the camera than the matte pink umbrella at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/20dee1754c6d2e33.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the black matte shirt at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.837, 0.588)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ad649fde229ca156.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and want to reach point (0.811, 0.013). How far do you need to walk?" }, { "from": "gpt", "value": "You need to walk 7.71 feet to reach point (0.811, 0.013) from the camera position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0672eefdbcbb3d01.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of soft gray sweater at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.235, 0.664)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f8f7add9adebcc4.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the bottom of the grand staircase in the historic building. You notice a blurred beige shirt at right near the point marked at coordinates (0.846, 0.695). Can you see the person wearing the shirt clearly?" }, { "from": "gpt", "value": "The blurred beige shirt at right is located at point (0.846, 0.695), which is described as blurred, so the person wearing it cannot be seen clearly." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ec322155d6740ab.jpg", "conversations": [ { "from": "human", "value": "\nWhere is light beige shirt at left located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.092, 0.487)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8406f4bfff10c5e7.jpg", "conversations": [ { "from": "human", "value": "\nDoes green grass at center have a larger size compared to brick stonework bell tower at center?" }, { "from": "gpt", "value": "No, green grass at center is not bigger than brick stonework bell tower at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a31244827915a58.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the golden mosaic temple at upper left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.115, 0.269)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9a5f308725a2d45b.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the white cotton shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.376, 0.661)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/caab7eb965069336.jpg", "conversations": [ { "from": "human", "value": "\nBetween brown muddy water at lower center and orange life vest at lower right, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "From the viewer's perspective, orange life vest at lower right appears more on the right side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00495759b6bb49c3.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.561, 0.542) or (0.880, 0.909)?" }, { "from": "gpt", "value": "Point (0.561, 0.542)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b712fb05804025f5.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte red dress at upper right have a smaller size compared to smooth gray shirt at upper right?" }, { "from": "gpt", "value": "No, matte red dress at upper right is not smaller than smooth gray shirt at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c956d050ff7d8a36.jpg", "conversations": [ { "from": "human", "value": "\nYou are a tailor who needs to determine which item is shorter between the green matte shirt at center and the matte skin boy at center. Which one should you choose?" }, { "from": "gpt", "value": "The green matte shirt at center is not as tall as the matte skin boy at center, so the green matte shirt at center is shorter and should be chosen." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a3db324d16f418b7.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the edge of the forest, and you want to take a photo of the black glossy table at center and the blue fabric shirt at left. Based on their positions, can you tell which object is closer to you?" }, { "from": "gpt", "value": "The blue fabric shirt at left is closer to you because the black glossy table at center is positioned under it, meaning the shirt is above and nearer to your viewpoint." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e667a1e15a71f2d.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green leafy tree at left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.111, 0.608)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/62e5c51a974b9821.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the edge of the coastal scene and want to walk from the green leafy tree at upper center to the green metal fence at lower center. How far do you need to walk in feet?" }, { "from": "gpt", "value": "The green leafy tree at upper center is 5.48 feet away from the green metal fence at lower center, so you need to walk 5.48 feet to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/39a5d1189b374ed6.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.114, 0.539) and camera?" }, { "from": "gpt", "value": "Point (0.114, 0.539) is 20.53 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4031fc78d7128765.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, matte black jacket at center or khaki textured trench coat at center?" }, { "from": "gpt", "value": "Positioned to the right is khaki textured trench coat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6a8b5935f82509b8.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the blue denim jacket at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.648, 0.714)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0cec8732e1302c57.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the white matte plate at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.748, 0.678)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3642f093deb8228b.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, brown matte eyebrow at upper center or matte brown eyebrow at upper center?" }, { "from": "gpt", "value": "Positioned to the right is matte brown eyebrow at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/62343babe7605a39.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, orange matte tree at center or green matte tree at center?" }, { "from": "gpt", "value": "orange matte tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1df6e24490974c65.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between white fabric at center and camera?" }, { "from": "gpt", "value": "5.81 feet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/18efb26a981b8c21.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.198, 0.309) and camera?" }, { "from": "gpt", "value": "They are 9.45 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d8b80fc829dbe395.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the scene of a building collapse. There is a point marked at coordinates point (0.869, 0.750). If you want to safely observe the structural damage without crossing the red and white striped barrier tape, can you see the point from your current position?" }, { "from": "gpt", "value": "The point (0.869, 0.750) is 11.91 meters from viewer, so yes, you can see the point from your current position as it is within visible range and not obstructed by the barrier tape." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/443c032d7990d59a.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of black suit at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.312, 0.261)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c9288f2c436a6b3.jpg", "conversations": [ { "from": "human", "value": "\nIs neon yellow vest at center to the right of white plastic pole at lower left from the viewer's perspective?" }, { "from": "gpt", "value": "Yes, neon yellow vest at center is to the right of white plastic pole at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/28b740c8a9cf9ebf.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked as point (0.247, 0.675) in the image. What item is located exactly at that point?" }, { "from": "gpt", "value": "The yellow cotton shorts at center are located exactly at point (0.247, 0.675)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/193e715ddeafdcf2.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the left, white stone relief at center or white stone writing at center?" }, { "from": "gpt", "value": "white stone relief at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/466a81415e6c2fbb.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the brown furry deer at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.846, 0.700)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e9a1877aa9c42bc.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of this grand space and want to walk towards the red carpet at the top of the stairs. Which direction should you move relative to the point marked at coordinate point (0.684, 0.647)?" }, { "from": "gpt", "value": "The point marked at coordinate point (0.684, 0.647) corresponds to the polished marble stairs at center. To reach the red carpet at the top of the stairs, you should move upwards from this point." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/14420f24b717f0dc.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between gray matte t-shirt at left and camera." }, { "from": "gpt", "value": "A distance of 26.41 inches exists between gray matte t-shirt at left and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc8a6faaf2d61ee3.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if translucent plastic bowl at center is positioned above white powdery flour at right?" }, { "from": "gpt", "value": "Indeed, translucent plastic bowl at center is positioned over white powdery flour at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d992c427b13ccee0.jpg", "conversations": [ { "from": "human", "value": "\nYou are an event organizer and need to ensure that both the matte black monitor at center and the black matte microphone at center are visible to the audience. Given their positions and sizes, which object might require adjustment to ensure it doesn not block the other?" }, { "from": "gpt", "value": "The matte black monitor at center is wider than the black matte microphone at center. Since the monitor is wider, it might be blocking the microphone from the audience perspective, so adjusting the microphone position could help ensure both are visible." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e1c7f85671e132c9.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green leafy tree at right? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.905, 0.388)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a544d94f3cf8c7cc.jpg", "conversations": [ { "from": "human", "value": "\nYou are a soccer coach analyzing a match. You notice the red matte jersey at center and the light blue jersey at center. Based on their positions, do you think they can communicate effectively with a standard whistle sound? Assume the whistle can be heard up to 40 feet." }, { "from": "gpt", "value": "The distance between the red matte jersey at center and light blue jersey at center is 33.68 feet, which is within the whistle range of 40 feet. Therefore, they can communicate effectively using a standard whistle sound." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8710a3c84d5c6e24.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the bottom of the staircase and want to reach the top. There are two points marked on the staircase. One is at point (0.800, 0.356) and the other is at point (0.233, 0.242). Which point should you step on first to ascend the staircase?" }, { "from": "gpt", "value": "You should step on point (0.800, 0.356) first because it is closer to the camera, meaning it is lower on the staircase and part of the first steps you would take when ascending." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e0676afc196e0ee.jpg", "conversations": [ { "from": "human", "value": "\nDoes green metallic sign at center have a smaller size compared to green matte sign at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34efa3edb638637a.jpg", "conversations": [ { "from": "human", "value": "\nIs fuzzy brown coat at center closer to the viewer compared to pink glossy meat at lower left?" }, { "from": "gpt", "value": "No, fuzzy brown coat at center is behind pink glossy meat at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8f214d03f4b3f25e.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.380, 0.994) come closer to viewer compared to point (0.570, 0.306)?" }, { "from": "gpt", "value": "Yes, point (0.380, 0.994) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0c0b04e45015ffd2.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the pink fabric scrub at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.885, 0.870)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eacf461fd40a20d0.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden raft at center shorter than matte yellow raft at lower left?" }, { "from": "gpt", "value": "No, wooden raft at center is not shorter than matte yellow raft at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3108b5ff38e7eea5.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the perfect shot of the black and tan fur dog at center and the white fluffy snow at center. Based on their positions, which object is higher in the image?" }, { "from": "gpt", "value": "The white fluffy snow at center is much taller than the black and tan fur dog at center, so the white fluffy snow at center is higher in the image." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08542fce10affb89.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, matte red shirt at lower left or white textured shirt at center?" }, { "from": "gpt", "value": "With less height is matte red shirt at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea3abae1038be6c3.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.252, 0.647) less distant than point (0.398, 0.412)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/905a05e73adb90a0.jpg", "conversations": [ { "from": "human", "value": "\nDoes yellow matte trailer truck at center come in front of black plastic license plate at center?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db9fc6a18c4babef.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a blue and white ceramic bowl at center. Pinpoint a point to the blue and white ceramic bowl at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.495, 0.561)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/27ea5c6bfa540df5.jpg", "conversations": [ { "from": "human", "value": "\nYou are a passenger on a moving train and want to know if you can fully see the jacket and window from your seat. The jacket is part of the same clothing as the hoodie mentioned in the scene. Are both the gray fleece jacket at upper right and the transparent glass window at upper left visible in their entirety from your current seat?" }, { "from": "gpt", "value": "The gray fleece jacket at upper right is shorter than the transparent glass window at upper left, so the jacket is shorter and might be fully visible, but the window is taller and could be partially obscured depending on your seat angle. However, since the jacket is shorter, it is more likely both are visible entirely." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e7b75d96ad32549f.jpg", "conversations": [ { "from": "human", "value": "\nWhere is denim jacket at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.774, 0.625)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dbedd12f9149cb7a.jpg", "conversations": [ { "from": "human", "value": "\nCould you provide the distance between matte black field camera at center and metallic silver enlarger at lower right?" }, { "from": "gpt", "value": "A distance of 44.32 centimeters exists between matte black field camera at center and metallic silver enlarger at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f65cd920309b1b0a.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer using a camera with a minimum focusing distance of 40 centimeters. You want to take a closeup photo of the smooth skin face at center. Can you focus on it?" }, { "from": "gpt", "value": "The smooth skin face at center and viewer are 43.72 centimeters apart, so yes, the photographer can focus on it since the distance is greater than the camera minimum focusing distance of 40 centimeters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73c235bda06c1528.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, blue fabric table at center or matte plastic book at center, stands taller?" }, { "from": "gpt", "value": "With more height is blue fabric table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/667441da06b28114.jpg", "conversations": [ { "from": "human", "value": "\nLocate the white powdery snow at lower center in the image." }, { "from": "gpt", "value": "[(0.494, 0.977)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea4ddb601cb8a793.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.267, 0.197)?" }, { "from": "gpt", "value": "green leafy tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ac99100d6b81e23.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at lower center shorter than green forested mountain at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d7cbaaaf5e15937.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.771, 0.492) behind point (0.767, 0.716)?" }, { "from": "gpt", "value": "Yes, it is behind point (0.767, 0.716)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d025da6696848d61.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the classroom and want to determine which of the two points, point (0.570, 0.794) or point (0.499, 0.333), is closer to you. Based on the image, which point is nearer?" }, { "from": "gpt", "value": "Point (0.570, 0.794) is closer to the camera than point (0.499, 0.333), so it is the nearer point." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ab34c1199a6d63d.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the white matte basketball player at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.594, 0.547)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c085bd94d63477f0.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker standing at the base of the dark green leafy tree at center. You want to reach the smooth brown hill at right. How far do you need to walk to get there?" }, { "from": "gpt", "value": "The dark green leafy tree at center is 385.71 feet away from the smooth brown hill at right, so you need to walk 385.71 feet to reach the smooth brown hill at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f2e6420861f07d3d.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of two flags and a person in formal attire. The flags are the Irish flag on the left and the American flag on the right. Where is the dark gray striped tie at center located in relation to the two flags?" }, { "from": "gpt", "value": "The dark gray striped tie at center is located at the center of the image, between the two flags." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c5e1f7258c29305e.jpg", "conversations": [ { "from": "human", "value": "\nHow distant is green leafy tree at center from light gray concrete stairs at center?" }, { "from": "gpt", "value": "37.95 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/472f9023dcff6fdf.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.349, 0.484) positioned in front of point (0.229, 0.581)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.229, 0.581)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dafb30fef1598167.jpg", "conversations": [ { "from": "human", "value": "\nYou are looking at a lock screen on a mobile device. You notice two items displayed on the game show backdrop. The pink fabric tie at right and the gray sweater at left. Which item is positioned higher on the screen?" }, { "from": "gpt", "value": "The pink fabric tie at right is positioned higher on the screen because it is above the gray sweater at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7dab6a7207822444.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy palm tree at center bigger than clear water at center?" }, { "from": "gpt", "value": "No, green leafy palm tree at center is not bigger than clear water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07349dbdb85d9b8c.jpg", "conversations": [ { "from": "human", "value": "\nBetween dark gray cloud at upper center and silvery metallic bird at right, which one is positioned higher?" }, { "from": "gpt", "value": "dark gray cloud at upper center is higher up." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be8f29f1d763453c.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the snow mountain and see the green matte tree at center and the green evergreen tree at right. Which tree is closer to you?" }, { "from": "gpt", "value": "The green matte tree at center is closer to you because the green evergreen tree at right is behind it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/456679e19284bd02.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.433, 0.113) from camera?" }, { "from": "gpt", "value": "Point (0.433, 0.113) is 38.04 feet from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/56e40c259d5e3930.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.131, 0.650) positioned in front of point (0.444, 0.567)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88c184b1bba3af7c.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.487, 0.994) or point (0.275, 0.370)?" }, { "from": "gpt", "value": "The point (0.275, 0.370) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9fc127be16bf8c6c.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the sandy beach at lower right and want to take a photo of the sunset using the black plastic camera at center. Can you reach the camera without moving from your current position?" }, { "from": "gpt", "value": "The sandy beach at lower right is below the black plastic camera at center, so you can reach the camera without moving from your current position since it is above you." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/869bc8c1c6218883.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the matte black suit at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.313, 0.669)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed51149ceb90fb1a.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of black polished metal lamp post at right. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.748, 0.350)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bee1f4354591ce2f.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of green leafy tree at center more distant than that of green grass at lower center?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8ff248ea1f45a422.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white cardboard boat at center is smaller than dark blue fabric umbrella at upper right?" }, { "from": "gpt", "value": "Incorrect, white cardboard boat at center is not smaller in size than dark blue fabric umbrella at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/18fa27ff1b57d844.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of golden stone tower at upper center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.332, 0.286)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f063a2f9d5200fc.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of white satin dress at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.687, 0.661)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b52ae8bbd19fd374.jpg", "conversations": [ { "from": "human", "value": "\nIs blue smooth shirt at center below matte blue shirt at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0816857cf8333414.jpg", "conversations": [ { "from": "human", "value": "\nBetween blue satin suit at center and light blue silk tie at center, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "blue satin suit at center is more to the right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7bc51c72aca917d9.jpg", "conversations": [ { "from": "human", "value": "\nYou are an attendee at this event and need to locate the person with the white mesh cap at left and the person with the smooth skin head at center. From your perspective, which one is positioned to the right of the other?" }, { "from": "gpt", "value": "The white mesh cap at left is to the right of smooth skin head at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36c878c0b6e1233a.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, white matte car at lower left or matte gray car at left?" }, { "from": "gpt", "value": "Positioned higher is matte gray car at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f40f67b6cf254d9.jpg", "conversations": [ { "from": "human", "value": "\nYou are a tourist standing on the dock looking at the green rocky mountain at center and the dark blue metallic cruise ship at right. Which object is closer to you?" }, { "from": "gpt", "value": "The green rocky mountain at center is closer to you because the dark blue metallic cruise ship at right is behind it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c0f654f04c06733.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.557, 0.742) or (0.312, 0.531)?" }, { "from": "gpt", "value": "The point (0.312, 0.531) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a309f782c6c33330.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the right, clear water at center or glossy wood bridge at center?" }, { "from": "gpt", "value": "From the viewer's perspective, glossy wood bridge at center appears more on the right side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2bbeac2c5b2a3f09.jpg", "conversations": [ { "from": "human", "value": "\nPoint to dark gray t-shirt at left.Point to the dark gray t-shirt at left in the image." }, { "from": "gpt", "value": "[(0.234, 0.703)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e178da6f24cbbe50.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer adjusting your camera to capture the person in the scene. The matte black glasses at center are positioned at coordinates 0.667 on the x and 0.279 on the y. To ensure the glasses are in focus, should you adjust your focus point to the left or right of their current position?" }, { "from": "gpt", "value": "The matte black glasses at center are already at the specified coordinates, so no adjustment is needed. Keep the focus point where it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a78c6fbe0b6cc5b8.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the office scene described. There is a point at coordinate (0.873, 0.578). What object is located at that point?" }, { "from": "gpt", "value": "The gray striped sweater at center is located at point (0.873, 0.578)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4ee73c8e2c2f92f.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.069, 0.509) or (0.850, 0.692)?" }, { "from": "gpt", "value": "Positioned behind is point (0.850, 0.692)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ffcfb57b443fb6d.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.974, 0.931) or (0.135, 0.270)?" }, { "from": "gpt", "value": "Point (0.974, 0.931)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86ee9060acdd1668.jpg", "conversations": [ { "from": "human", "value": "\nBetween black matte wetsuit at center and matte yellow scuba tank at left, which one is positioned lower?" }, { "from": "gpt", "value": "black matte wetsuit at center is below." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb92aadc3d5c2e07.jpg", "conversations": [ { "from": "human", "value": "\nYou are an underwater photographer aiming to capture the polka dot yellow fish at center and the smooth rock at center in the same frame. Based on their positions, which object should you adjust your camera to focus on first to ensure both are in the shot?" }, { "from": "gpt", "value": "The smooth rock at center is to the right of the polka dot yellow fish at center, so you should focus on the polka dot yellow fish at center first to ensure both are captured in the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9fc903282adfb218.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a clear shot of both the pink plastic water bottle at center and the gray rough rock at lower left. Based on their positions, which object will appear larger in the photo?" }, { "from": "gpt", "value": "The pink plastic water bottle at center will appear larger in the photo because it is closer to the viewer than the gray rough rock at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a142430099dccb53.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at a wedding ceremony. You need to adjust the camera focus to capture both the pearl lace dress at center and the clear crystal tiara at center. Which object should you focus on first if you want to ensure the taller one is in focus?" }, { "from": "gpt", "value": "The clear crystal tiara at center is taller than the pearl lace dress at center, so you should focus on the clear crystal tiara at center first to ensure it is in focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04d49113cd23b70c.jpg", "conversations": [ { "from": "human", "value": "\nYou are an architect evaluating the skyline of this city. You notice the green glassy tower at center and the green glass skyscraper at upper right. Which of these two structures is taller?" }, { "from": "gpt", "value": "The green glassy tower at center is taller than the green glass skyscraper at upper right according to the description provided." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec1c86511ffe978d.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the start of the dirt path in the coastal scene. You want to reach the green leafy tree at upper right. How far is it from your current position?" }, { "from": "gpt", "value": "The green leafy tree at upper right is 22.69 meters away from the viewer, so it is approximately 22.69 meters away from your current position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df9ab2997508d01a.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark brown sweater at center appear on the right side of black fabric shirt at center?" }, { "from": "gpt", "value": "Indeed, dark brown sweater at center is positioned on the right side of black fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5123529956b35184.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the matte glass landscape at upper right? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.706, 0.362)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9a96c3cdf0c5c8fe.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of white shirt and tie at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.717, 0.631)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c2ba6ce6ea5f9e98.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the right, rusty metal silo at center or rusty metallic silo at center?" }, { "from": "gpt", "value": "rusty metal silo at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/97f449a9f53ea7fb.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing materials for a landscaping project and need to know which item takes up more space. Based on the scene, which occupies more area between the brown dry hay at lower right and the tan fabric shirt at center?" }, { "from": "gpt", "value": "The tan fabric shirt at center occupies more space than the brown dry hay at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7be340a8e580aae.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between green leafy tree at upper center and camera?" }, { "from": "gpt", "value": "green leafy tree at upper center is 36.28 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ac06c12fee8b49a.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of matte pink shirt at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.828, 0.697)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a8b1fbb478f7fe8.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person who needs to park your white matte van at lower left on the paved concrete sidewalk at lower center. Is there enough space for the van to park there?" }, { "from": "gpt", "value": "The paved concrete sidewalk at lower center is below the white matte van at lower left, which means the van is already parked there. Therefore, there is space for the van to park on the sidewalk." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b85a43ee88ba7949.jpg", "conversations": [ { "from": "human", "value": "\nYou are a passenger waiting on the platform and need to board the train. You see the sleek silver train at left and the dark blue jeans at right. Which one is taller?" }, { "from": "gpt", "value": "The sleek silver train at left is taller than the dark blue jeans at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed3b3e3f831af060.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.294, 0.562) and point (0.359, 0.516), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.294, 0.562) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4348c9f13ecfc065.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the white tank top at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.233, 0.694)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc2a44e9e588cea5.jpg", "conversations": [ { "from": "human", "value": "\nYou are planning to set up a picnic table in this outdoor area. Based on the scene, which object would cast a longer shadow at noon? Please consider the green leafy tree at upper center and the brown wooden table at lower right." }, { "from": "gpt", "value": "The green leafy tree at upper center is much taller than the brown wooden table at lower right, so it would cast a longer shadow at noon." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d77e4907c7ec0948.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked as point (0.500, 0.806) in the image. What type of surface are you standing on?" }, { "from": "gpt", "value": "The asphalt road at center is located at point (0.500, 0.806), so you are standing on asphalt road at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/150eb35621124f49.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth asphalt at center taller than blue metallic motorcycle at lower right?" }, { "from": "gpt", "value": "Incorrect, smooth asphalt at center's height is not larger of blue metallic motorcycle at lower right's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/76646b764a4184e1.jpg", "conversations": [ { "from": "human", "value": "\nIs ribbed gray sweater at center below brown matte shirt at center?" }, { "from": "gpt", "value": "Incorrect, ribbed gray sweater at center is not positioned below brown matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07d1f85e436bb113.jpg", "conversations": [ { "from": "human", "value": "\nWhat is at (0.181, 0.287)?" }, { "from": "gpt", "value": "matte plastic arrow at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/43aa47aaaa2799cd.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.504, 0.294)?" }, { "from": "gpt", "value": "brown rough bark tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/501b2fd042d7cc42.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black jacket at left have a lesser width compared to dark blue leather jacket at center?" }, { "from": "gpt", "value": "In fact, matte black jacket at left might be wider than dark blue leather jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bcc481918419528b.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.958, 0.917) come farther from viewer compared to point (0.719, 0.333)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7f6d110db2ce863c.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a green matte net at center. Pinpoint a point to the green matte net at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.707, 0.477)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78482d6f8b45ef92.jpg", "conversations": [ { "from": "human", "value": "\nHow close is green grass field at lower center from camera?" }, { "from": "gpt", "value": "The distance of green grass field at lower center from camera is 16.11 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5352d89aa28c016e.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a navy blue dress at center. Pinpoint a point to the navy blue dress at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.605, 0.598)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36747dc1f9c728c4.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the yellow stone church at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.285, 0.562)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/744c6f578f137617.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, matte blue cushion at center or black glossy cat at center?" }, { "from": "gpt", "value": "From the viewer's perspective, matte blue cushion at center appears more on the right side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2698afff6e141b2.jpg", "conversations": [ { "from": "human", "value": "\nYou are a bird flying over the scene and want to land on the transparent plastic fence at center. However, there is a green wire tree at upper right nearby. Which object is closer to the ground, allowing you to land safely?" }, { "from": "gpt", "value": "The transparent plastic fence at center is positioned under the green wire tree at upper right, meaning the fence is closer to the ground than the tree. Therefore, you can safely land on the transparent plastic fence at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b85ba932dcd570f1.jpg", "conversations": [ { "from": "human", "value": "\nBetween olive green quilted jacket at center and wooden desk at lower right, which one is positioned higher?" }, { "from": "gpt", "value": "Positioned higher is olive green quilted jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e39fc795fcdc9e65.jpg", "conversations": [ { "from": "human", "value": "\nPoint to black paper sign at right.Point to the black paper sign at right in the image." }, { "from": "gpt", "value": "[(0.813, 0.492)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/54328b4fc4befb95.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.288, 0.550) or point (0.727, 0.952)?" }, { "from": "gpt", "value": "Point (0.727, 0.952)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/adccb59254960809.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown water at center lie in front of green matte forested mountain at left?" }, { "from": "gpt", "value": "Yes, it is in front of green matte forested mountain at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/72b9ec747627b620.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing in the middle of the street. You want to take a photo of the monument with both the shiny black sedan at right and the shiny black car at left in the frame. Which car should you position closer to the monument to ensure both vehicles are visible in the photo?" }, { "from": "gpt", "value": "The shiny black car at left should be positioned closer to the monument because the shiny black sedan at right is already on the right side of it, so moving the left car closer would help frame both vehicles within the photo." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4da36ac621b0c1f.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.168, 0.681) come closer to viewer compared to point (0.340, 0.456)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc13a628a2dc2135.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, green striped shirt at center or green leafy fern at left?" }, { "from": "gpt", "value": "green leafy fern at left is higher up." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c4d7ac5b35b72c6.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.379, 0.500) and point (0.261, 0.534), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.261, 0.534) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/080668ef3cc13fce.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue cotton shirt at center appear on the left side of printed fabric blouse at upper right?" }, { "from": "gpt", "value": "Correct, you'll find blue cotton shirt at center to the left of printed fabric blouse at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cde7ea2619b1a323.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, white cotton shirt at center or blue cotton shirt at center, stands shorter?" }, { "from": "gpt", "value": "white cotton shirt at center is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/104205b529f6e356.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.074, 0.552) farther from camera compared to point (0.301, 0.255)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/137a34dfced15f34.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.386, 0.609)?" }, { "from": "gpt", "value": "dark gray feathers at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/559b2b02ab78b611.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte beige blouse at center is positioned to the left of black plastic table at center?" }, { "from": "gpt", "value": "Correct, you'll find matte beige blouse at center to the left of black plastic table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5e597b8eef54000.jpg", "conversations": [ { "from": "human", "value": "\nIs dark brown leather jacket at center to the right of leather jacket at lower right from the viewer's perspective?" }, { "from": "gpt", "value": "Incorrect, dark brown leather jacket at center is not on the right side of leather jacket at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/74896d914af56e3f.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if striped cotton shirt at center is positioned to the left of matte red vest at center?" }, { "from": "gpt", "value": "Indeed, striped cotton shirt at center is positioned on the left side of matte red vest at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/705d0ebee577b4ba.jpg", "conversations": [ { "from": "human", "value": "\nHow far is dark brown hair at lower right from camera?" }, { "from": "gpt", "value": "dark brown hair at lower right and camera are 12.53 feet apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9477436d1775b04a.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any camouflage fabric helmet at center in the image." }, { "from": "gpt", "value": "[(0.717, 0.227)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b621cd9499ccb0a.jpg", "conversations": [ { "from": "human", "value": "\nHow close is green leafy tree at center from yellow matte shirt at right?" }, { "from": "gpt", "value": "They are 469.51 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b2ba59e4d0418790.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of stained glass window at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.411, 0.261)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/084573c41d29d620.jpg", "conversations": [ { "from": "human", "value": "\nLocate the printed cotton shirt at left in the image." }, { "from": "gpt", "value": "[(0.035, 0.600)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1be4a73713d26838.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.708, 0.700) come farther from viewer compared to point (0.370, 0.909)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0678bff130bd7308.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the kitchen and want to grab a plate from the white ceramic plates at lower left. How far do you need to reach to get one?" }, { "from": "gpt", "value": "The white ceramic plates at lower left are 81.60 centimeters away from the viewer, so you need to reach 81.60 centimeters to get one." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb90c5d608bdba17.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the wooden canoe at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.960, 0.844)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46ca91be0cfd08e9.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to golden fur dog at center? Please provide its 2D coordinates.Where can I find golden fur dog at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.494, 0.267)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c0120825a3a2b7b8.jpg", "conversations": [ { "from": "human", "value": "\nIs brown bark tree at left to the right of bare branches at upper center from the viewer's perspective?" }, { "from": "gpt", "value": "No, brown bark tree at left is not to the right of bare branches at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5710d72485cc31f3.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.899, 0.775) or (0.309, 0.572)?" }, { "from": "gpt", "value": "Point (0.899, 0.775) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/38d9e3d67d976ef4.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to green grass at center? Please provide its 2D coordinates.Where can I find green grass at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.493, 0.828)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fd422f2180e59e46.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.712, 0.448)?" }, { "from": "gpt", "value": "white paper at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/55fca5e59f55ce5a.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of white cotton shirt at lower center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.632, 0.778)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df5123ffcf19fa20.jpg", "conversations": [ { "from": "human", "value": "\nYou are an artist planning to paint the scene. You want to ensure the rustic rock formation at center and the matte blue sweater at center are proportionally accurate. Which object should you make larger in your painting?" }, { "from": "gpt", "value": "The rustic rock formation at center should be depicted as larger than the matte blue sweater at center in the painting since it is described as larger in size according to the scene description." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4cd4113062a29d56.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.553, 0.956) closer to viewer compared to point (0.441, 0.525)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.441, 0.525)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4364506406356c8.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.696, 0.422) and camera?" }, { "from": "gpt", "value": "Point (0.696, 0.422) and camera are 7.71 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c3f7fc333bbdf45a.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.298, 0.761) or (0.208, 0.794)?" }, { "from": "gpt", "value": "Point (0.208, 0.794) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/10e090b3b0a90c7d.jpg", "conversations": [ { "from": "human", "value": "\nYou are an interior designer planning to place a new decorative item in the bedroom. You have a small decorative item that needs to fit between the translucent beige curtains at center and the beige fabric lampshade at right. Considering their sizes, which object should you place the item next to to ensure it doesn" }, { "from": "gpt", "value": "The translucent beige curtains at center are larger than the beige fabric lampshade at right, so placing the small decorative item next to the beige fabric lampshade at right would leave enough space for it to fit comfortably." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8728e5e7b2c71577.jpg", "conversations": [ { "from": "human", "value": "\nIs striped fabric shirt at center positioned before chocolate matte cake at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78d925ca57964ff6.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the black plastic keyboard at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.746, 0.672)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01d716aa181a3101.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of brown soil at center in the image." }, { "from": "gpt", "value": "[(0.544, 0.892)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc107c864a962f86.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.240, 0.330)?" }, { "from": "gpt", "value": "rocky gray mountain at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fbe4cabd38ec1557.jpg", "conversations": [ { "from": "human", "value": "\nDoes stone clock tower at center appear on the left side of checkered fabric balloon at upper center?" }, { "from": "gpt", "value": "Incorrect, stone clock tower at center is not on the left side of checkered fabric balloon at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/25b52c75441454d5.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the ancient Roman site and want to take a photo of the point at coordinates point (0.430, 0.072). Your camera has a maximum focus range of 75 meters. Will you be able to focus on the point?" }, { "from": "gpt", "value": "The point (0.430, 0.072) is 76.06 meters away from the camera, which exceeds the maximum focus range of 75 meters. Therefore, the camera will not be able to focus on the point." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf9eff14266fd5e1.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker who wants to retrieve your camouflage fabric jacket at left from the rocky area. However, there is a blue fabric kayak at right in your path. Based on their positions, can you reach the jacket without moving the kayak?" }, { "from": "gpt", "value": "The camouflage fabric jacket at left is located below the blue fabric kayak at right, so you can reach the jacket without moving the kayak since it is positioned underneath it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/000d655d579b9b30.jpg", "conversations": [ { "from": "human", "value": "\nIs clear water at center to the left of white foamy wave at lower center from the viewer's perspective?" }, { "from": "gpt", "value": "Indeed, clear water at center is positioned on the left side of white foamy wave at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/614ab5e0298ddefd.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass at lower center smaller than bare branches at left?" }, { "from": "gpt", "value": "No, green grass at lower center is not smaller than bare branches at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2006a810fbe9eb94.jpg", "conversations": [ { "from": "human", "value": "\nBetween green plastic chair at lower right and white plastic chair at center, which one has more height?" }, { "from": "gpt", "value": "green plastic chair at lower right is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/24e7a31fe737e674.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of floral kimono at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.188, 0.655)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e34ac1a5092c7566.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.022, 0.603)?" }, { "from": "gpt", "value": "matte red jacket at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/809c2a765cf9ebf8.jpg", "conversations": [ { "from": "human", "value": "\nYou are planning to place a new bench in the garden between the wooden log cabin at center and the polished bronze statue at center. Based on their widths, which object should the bench be closer to ensure it doesn" }, { "from": "gpt", "value": "The wooden log cabin at center might be wider than the polished bronze statue at center, so the bench should be placed closer to the wooden log cabin at center to accommodate its greater width." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00e0fb3264523948.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the light blue fabric person at lower left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.178, 0.703)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cb7d4231e15cd843.jpg", "conversations": [ { "from": "human", "value": "\nDescribe the object at (0.290, 0.408)." }, { "from": "gpt", "value": "smooth wooden post at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e679ed04fed7db2.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing items on a shelf and need to know the height of both the burlap coffee bag at upper left and the blue plastic toothpaste at center right. Which one is taller?" }, { "from": "gpt", "value": "The burlap coffee bag at upper left is taller than the blue plastic toothpaste at center right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f70a87ecf5d2ae5.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the event and want to ensure both the blue printed fabric at center and the blue floral shirt at center are fully visible in your shot. Which one requires you to adjust your framing to include its full length?" }, { "from": "gpt", "value": "The blue floral shirt at center is taller than the blue printed fabric at center, so you need to adjust your framing to include the full length of the blue floral shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c05185e269871d2.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, white matte t-shirt at center or striped tank top at center, stands shorter?" }, { "from": "gpt", "value": "With less height is striped tank top at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/63e81aaad9ec9fbf.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a black matte jacket at center. Pinpoint a point to the black matte jacket at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.605, 0.636)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29ece28a9852724e.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.432, 0.487) or point (0.195, 0.592)?" }, { "from": "gpt", "value": "Point (0.432, 0.487)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/163f61b2e8d6e6ed.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, pink fabric hospital bed at center or white hospital gown at center?" }, { "from": "gpt", "value": "pink fabric hospital bed at center is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88e8bfe12c27ce09.jpg", "conversations": [ { "from": "human", "value": "\nIs red fabric jacket at center taller than dark blue fabric at center?" }, { "from": "gpt", "value": "Indeed, red fabric jacket at center has a greater height compared to dark blue fabric at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/937c800ea36ab3b1.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up for a portrait session. You have a camera with a lens that can focus on objects within 2 inches. You notice the smooth skin face at center and the matte red hair at center in the scene. Can your camera capture both subjects in focus simultaneously?" }, { "from": "gpt", "value": "The distance between the smooth skin face at center and the matte red hair at center is 1.99 inches, which is within the camera lens focus range of 2 inches. Therefore, the camera can capture both subjects in focus simultaneously." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0c65d847238f9e87.jpg", "conversations": [ { "from": "human", "value": "\nYou are a wildlife photographer standing on the edge of the pond. You want to capture a photo of both the white glossy swan at left and the white matte swan at center in the same frame. Given that your camera has a maximum focus range of 2 meters, will you be able to include both swans in your shot?" }, { "from": "gpt", "value": "The distance between the white glossy swan at left and the white matte swan at center is 2.59 meters. Since your camera can only focus up to 2 meters, you won" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c5d7d68bdd18d54c.jpg", "conversations": [ { "from": "human", "value": "\nIs rusty wood boat at center closer to the viewer compared to white cotton shirt at right?" }, { "from": "gpt", "value": "Yes, rusty wood boat at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/84913bf10ee70fbc.jpg", "conversations": [ { "from": "human", "value": "\nIs pink matte blouse at left to the left of orange satin skirt at center from the viewer's perspective?" }, { "from": "gpt", "value": "Correct, you'll find pink matte blouse at left to the left of orange satin skirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4e8a0d8ead265856.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the dark matte chocolate cake at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.179, 0.450)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ac5c9a001c64132a.jpg", "conversations": [ { "from": "human", "value": "\nIs orange matte soccer ball at center bigger than white matte soccer player at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3f3dc8576af3d460.jpg", "conversations": [ { "from": "human", "value": "\nYou are a military equipment inspector tasked with verifying the specifications of the metallic gray gun at center and the matte black goggles at center. Based on the image, which object is bigger?" }, { "from": "gpt", "value": "The metallic gray gun at center is larger in size than the matte black goggles at center, so the metallic gray gun at center is bigger." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/72ba07bf04c6760e.jpg", "conversations": [ { "from": "human", "value": "\nWhere is clear water at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.397, 0.881)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/75a05959aec0523e.jpg", "conversations": [ { "from": "human", "value": "\nIs dark brown wood plank at center positioned in front of dark brown wood plank at upper left?" }, { "from": "gpt", "value": "Yes, it is in front of dark brown wood plank at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b588c0b6c60b361.jpg", "conversations": [ { "from": "human", "value": "\nIs green hedge at center thinner than shiny dark gray dome at center?" }, { "from": "gpt", "value": "In fact, green hedge at center might be wider than shiny dark gray dome at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/10860aa16e0bfef9.jpg", "conversations": [ { "from": "human", "value": "\nLocate camouflage fabric gun at center in the image." }, { "from": "gpt", "value": "[(0.377, 0.848)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/878bc0f70788c5b1.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the orange matte t-shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.805, 0.619)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d3d74970c3784de.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of white matte guitar at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.205, 0.569)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f8398beb752b5aad.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the matte red barn at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.251, 0.380)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c36355fba34a48ee.jpg", "conversations": [ { "from": "human", "value": "\nYou are a tourist standing at the starting point of the street. You want to take a photo of the yellow metallic tram at center from a safe distance. The tram is 40.99 meters away. Given that the recommended safe distance for photographing moving trams is 30 meters, is the current distance safe?" }, { "from": "gpt", "value": "The yellow metallic tram at center is 40.99 meters away, which exceeds the recommended safe distance of 30 meters. Therefore, the current distance is not safe for photographing the moving tram." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/31839cf741b89635.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery driver who needs to park your vehicle under the bridge. You see the concrete textured column at center and the white plastic license plate at center. Which object is closer to the left side of the parking area?" }, { "from": "gpt", "value": "The concrete textured column at center is closer to the left side of the parking area because it is positioned to the left of the white plastic license plate at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5473d81fd61fbb46.jpg", "conversations": [ { "from": "human", "value": "\nHow close is point (0.557, 0.762) from camera?" }, { "from": "gpt", "value": "The distance of point (0.557, 0.762) from camera is 3.62 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8eafbad315ad0075.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown speckled bird at upper left is shorter than blue-green metallic bird feeder at lower left?" }, { "from": "gpt", "value": "Yes, brown speckled bird at upper left is shorter than blue-green metallic bird feeder at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7f9f0e56f93fbc7.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position looking at the farm scene. There is a specific point marked at coordinates point (0.169, 0.133). How far is that point from your current position?" }, { "from": "gpt", "value": "The point (0.169, 0.133) is 21.87 meters away from the camera position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe7358ee0c5a967d.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the center of the white bridge and want to locate the dark reflective water at center. According to the coordinates provided, in which direction should you look to find it?" }, { "from": "gpt", "value": "The dark reflective water at center is located at coordinates point (0.440, 0.678). Since you are at the center of the white bridge, you should look towards the direction indicated by those coordinates to find it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95d340e83e73cca2.jpg", "conversations": [ { "from": "human", "value": "\nWhere is orange dotted tie at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.753, 0.648)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b2e6dff3e3f8ab08.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.268, 0.558)?" }, { "from": "gpt", "value": "denim jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff58dd2a98e2a7ad.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.284, 0.614) lie behind point (0.832, 0.731)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02b7f1ba53b03c44.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of rustic wooden balcony at lower center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.320, 0.883)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44de46260949d808.jpg", "conversations": [ { "from": "human", "value": "\nBetween white and red striped tank top at center and matte red flag at right, which one is positioned lower?" }, { "from": "gpt", "value": "matte red flag at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef8d8b044d0254b0.jpg", "conversations": [ { "from": "human", "value": "\nDoes dry straw at center appear over natural straw bale at center?" }, { "from": "gpt", "value": "Indeed, dry straw at center is positioned over natural straw bale at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d2535e3fb82015ad.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a dark gray cloud at upper center. Pinpoint a point to the dark gray cloud at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.487, 0.245)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/97a56ec4edcfa8b8.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the green leafy tree at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.328, 0.156)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6edba712a94a9c09.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance from blue matte bus at center to white matte van at left." }, { "from": "gpt", "value": "They are 19.29 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e77a5611fe7b7abb.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at left shorter than stone hut at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/93f4fdf88bb78710.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if clear water at center is bigger than brown leafy tree at center?" }, { "from": "gpt", "value": "No, clear water at center is not bigger than brown leafy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca3149ade0119323.jpg", "conversations": [ { "from": "human", "value": "\nLocate all black leather shoe at lower left in the image." }, { "from": "gpt", "value": "[(0.199, 0.831)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8816dfa894bd7c86.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.952, 0.300) closer to camera compared to point (0.727, 0.381)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d3c4a44ab4a419f.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of the park and see the smooth bark tree at center. If you walk straight towards the tree, will you encounter the curved black metal fence before reaching it?" }, { "from": "gpt", "value": "The smooth bark tree at center is located at point (0.919, 0.298), which is beyond the curved black metal fence in the middle ground. Therefore, walking straight towards the tree would require passing through the fence first before reaching it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/963cd43d7c1e3df1.jpg", "conversations": [ { "from": "human", "value": "\nHow far is point (0.686, 0.666) from the camera?" }, { "from": "gpt", "value": "A distance of 22.12 inches exists between point (0.686, 0.666) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cdd5834e482e1707.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.680, 0.991) more distant than point (0.550, 0.697)?" }, { "from": "gpt", "value": "No, (0.680, 0.991) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0906e82db26d154b.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.183, 0.627) and point (0.717, 0.605), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.717, 0.605) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7a9ea37ddf4a6f1a.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, white printed shirt at center or white jersey at center?" }, { "from": "gpt", "value": "Positioned higher is white jersey at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/078f64c2a9603b05.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the matte pink snowsuit at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.195, 0.627)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b934a33e11331cc3.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the white smooth dog at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.775, 0.431)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a859629b29387e8c.jpg", "conversations": [ { "from": "human", "value": "\nYou are a server at a networking event and need to deliver a wine glass to the table. The table has both a clear glass wine glass at center and a translucent glass wine at center. Which one should you choose to place the new wine glass next to?" }, { "from": "gpt", "value": "You should place the new wine glass next to the translucent glass wine at center because the clear glass wine glass at center is already 1.38 meters away from it, leaving space for the new glass." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1eb49563a894424f.jpg", "conversations": [ { "from": "human", "value": "\nIs green matte shirt at center bigger than gray fabric jacket at lower center?" }, { "from": "gpt", "value": "Incorrect, green matte shirt at center is not larger than gray fabric jacket at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/705ca5531ba4cac2.jpg", "conversations": [ { "from": "human", "value": "\nYou are a drone operator trying to capture a photo of the weathered wood dock at center. The drone has a camera with a 100mm focal length lens. If the drone is positioned at point A, which is 10 meters away from the dock, what is the approximate distance between the drone and the dock in meters to ensure the dock fills the frame?" }, { "from": "gpt", "value": "The question cannot be answered with the provided information because the 2D coordinates of the weathered wood dock at center do not provide sufficient data about its physical dimensions or the required framing for the drone photography calculation." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b370179e16d2839.jpg", "conversations": [ { "from": "human", "value": "\nDoes purple fabric table at center have a lesser width compared to matte purple shirt at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/835f4252569a53e7.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the green metal fence at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.501, 0.753)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78beb0923f9a5e3f.jpg", "conversations": [ { "from": "human", "value": "\nYou are a pedestrian standing on the sidewalk and want to cross the street to the central building. The gray concrete curb at lower center is in your way. Which direction should you move to avoid the green leafy tree at upper center and reach the curb safely?" }, { "from": "gpt", "value": "You should move to the right to avoid the green leafy tree at upper center, as it is on the left side of the gray concrete curb at lower center, allowing you to reach the curb safely." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b18284f9fe7da24e.jpg", "conversations": [ { "from": "human", "value": "\nIs matte blue shirt at center wider than matte black shirt at upper center?" }, { "from": "gpt", "value": "Correct, the width of matte blue shirt at center exceeds that of matte black shirt at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/036c877a1a54e551.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from white fabric shoe at lower right to camera." }, { "from": "gpt", "value": "A distance of 4.32 feet exists between white fabric shoe at lower right and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b6306c902ed06267.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.647, 0.827) and point (0.277, 0.520), which one is positioned behind?" }, { "from": "gpt", "value": "Positioned behind is point (0.277, 0.520)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/54edfeb1b0c01989.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, gray rock cliff at center or orange life vest at lower left?" }, { "from": "gpt", "value": "orange life vest at lower left is below." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8388bd21f2f4082c.jpg", "conversations": [ { "from": "human", "value": "\nIs brown stone tower at left to the right of orange wooden clock at center from the viewer's perspective?" }, { "from": "gpt", "value": "Incorrect, brown stone tower at left is not on the right side of orange wooden clock at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4ffc5a54942bb780.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if bamboo raft at center is positioned to the left of bamboo paddle at center?" }, { "from": "gpt", "value": "Yes, bamboo raft at center is to the left of bamboo paddle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e305dd7e97d58a8.jpg", "conversations": [ { "from": "human", "value": "\nDoes multicolored fabric top at center have a larger size compared to denim shorts at center?" }, { "from": "gpt", "value": "Indeed, multicolored fabric top at center has a larger size compared to denim shorts at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5edda794df9ce562.jpg", "conversations": [ { "from": "human", "value": "\nYou are a pedestrian standing on the cobblestone street and want to cross to the other side. There is a silver metallic sedan at right and a green shirt at upper left. Which object is closer to you?" }, { "from": "gpt", "value": "The silver metallic sedan at right is closer to you because the green shirt at upper left is behind it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/122a281538be9902.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black matte ski suit at center is positioned to the right of matte black jacket at center?" }, { "from": "gpt", "value": "Incorrect, black matte ski suit at center is not on the right side of matte black jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e629ef8609ea989.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.447, 0.591) and point (0.138, 0.506), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.138, 0.506) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/12637dd83ef40d36.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy field at center is shorter than green leafy hedge at center?" }, { "from": "gpt", "value": "Incorrect, green leafy field at center's height does not fall short of green leafy hedge at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9e0841a929b203c.jpg", "conversations": [ { "from": "human", "value": "\nLocate all smooth tan skin at center in the image." }, { "from": "gpt", "value": "[(0.437, 0.519)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4273e4bb447fced3.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a fluffy yellow costume at center. Pinpoint a point to the fluffy yellow costume at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.427, 0.650)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70ae18fe7323a8e6.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.146, 0.180) or (0.735, 0.322)?" }, { "from": "gpt", "value": "Point (0.146, 0.180) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a6ab047a562e4fc.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at a distance from the table where the man in the dark sweater and the woman with the laptop are seated. If you want to place a small object exactly at the point labeled as point (0.567, 0.520), how far should you move forward from your current position to reach that point?" }, { "from": "gpt", "value": "You should move forward 3.62 meters to reach the point labeled as point (0.567, 0.520) because the distance between the point and the viewer is exactly 3.62 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/130a0ddc2c1d2f38.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the green matte truck at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.697, 0.863)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/524a69207763b0bc.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.711, 0.777) positioned after point (0.634, 0.753)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/afd5af7a5e940253.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.394, 0.641) or point (0.892, 0.578)?" }, { "from": "gpt", "value": "The point (0.892, 0.578) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1ffff1af2257bb5.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the brick pavement at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.429, 0.873)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5db0d329af0fcfd1.jpg", "conversations": [ { "from": "human", "value": "\nYou are a parking attendant who needs to check license plates. You see the white plastic license plate at center and the black plastic license plate at center. Which license plate is above the other?" }, { "from": "gpt", "value": "The white plastic license plate at center is positioned over the black plastic license plate at center, so the white one is above the black one." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6bb4d9b3127b2029.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, gray sweater at center or white paperboard at upper center, stands shorter?" }, { "from": "gpt", "value": "gray sweater at center is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d0e98acd38c6910.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the smooth concrete pillar at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.054, 0.263)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d7e2afae5a185b6.jpg", "conversations": [ { "from": "human", "value": "\nIs gray cotton t-shirt at center bigger than metallic silver microphone at lower left?" }, { "from": "gpt", "value": "Yes, gray cotton t-shirt at center is bigger than metallic silver microphone at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/99f25834bcbe27c4.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the tree on the right side of the frame and want to greet both people wearing the green checkered suit at left and dark gray suit at right. Which one should you approach first based on their positions?" }, { "from": "gpt", "value": "You should approach the green checkered suit at left first since it is positioned to the left of the dark gray suit at right, meaning it is closer to your current position near the tree on the right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4cbaaafac4e8e94.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.102, 0.259)?" }, { "from": "gpt", "value": "green leafy tree at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9214eeba1685251f.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.103, 0.689) farther from camera compared to point (0.958, 0.778)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5bd2ceb111b06b59.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the light gray fabric bicycle at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.610, 0.625)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34a13ceb2d054eff.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of velvet dark green armchair at left. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.209, 0.461)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cfbedd60b2cf14e7.jpg", "conversations": [ { "from": "human", "value": "\nHow close is purple smooth shirt at center from camera?" }, { "from": "gpt", "value": "They are 39.25 inches apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f84ea9548f9ca1f.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a photo of the green parrot at center and the black plastic goggles at upper center in the scene. What is the distance between these two objects?" }, { "from": "gpt", "value": "The distance between the green parrot at center and the black plastic goggles at upper center is 65.02 centimeters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/15e03c23b87ea5c7.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of brown sand at lower center in the image." }, { "from": "gpt", "value": "[(0.767, 0.841)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36aca54a7f0bc036.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in a garden and see two green leafy trees in the image. Which tree, the green leafy tree at upper center or the green leafy tree at center, is closer to you?" }, { "from": "gpt", "value": "The green leafy tree at upper center is closer to you because it is in front of the green leafy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/30ede54840ebc517.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the vineyard and want to take a photo of both the brown stone bell tower at right and the green leafy tree at upper right in the same frame. Which object should you position closer to the left side of your camera viewfinder to include both in the shot?" }, { "from": "gpt", "value": "You should position the brown stone bell tower at right closer to the left side of your camera viewfinder because it is located to the left of the green leafy tree at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/40c3518b339e340c.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, brown fabric at center or white soft baby at center?" }, { "from": "gpt", "value": "white soft baby at center is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/11eaee4cd8465be6.jpg", "conversations": [ { "from": "human", "value": "\nIs blue matte tank top at center closer to camera compared to pink fabric sandal at lower center?" }, { "from": "gpt", "value": "Yes, blue matte tank top at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04696bfe6aa4c3f2.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte car at center smaller than metallic silver car at center?" }, { "from": "gpt", "value": "Indeed, black matte car at center has a smaller size compared to metallic silver car at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/691117fba625a28b.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.575, 0.289)?" }, { "from": "gpt", "value": "leather jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c12faacb8171cea5.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any white fabric flag at upper left in the image." }, { "from": "gpt", "value": "[(0.200, 0.261)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a700c80234f8601.jpg", "conversations": [ { "from": "human", "value": "\nDoes green rubber basketball court at center appear over blue jersey at center?" }, { "from": "gpt", "value": "No, green rubber basketball court at center is not above blue jersey at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/777be422868db5e8.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.483, 0.795) and camera?" }, { "from": "gpt", "value": "Point (0.483, 0.795) is 3.90 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bad2ed9525612174.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.840, 0.683) or point (0.198, 0.527)?" }, { "from": "gpt", "value": "Positioned behind is point (0.198, 0.527)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/458fb39d0fed104f.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of matte red bag at lower left from white fabric person at lower right?" }, { "from": "gpt", "value": "matte red bag at lower left is 19.38 meters from white fabric person at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c70c5fc8e0874804.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the white matte shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.644, 0.658)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7eaf47d72e3560f8.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the black baseball cap at the center. There is a point marked at coordinates (0.860, 0.273). What object is located at that point?" }, { "from": "gpt", "value": "The point at coordinates (0.860, 0.273) indicates the beige striped cardboard box at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7bcfc0a9ba540f9.jpg", "conversations": [ { "from": "human", "value": "\nIs rusty metal excavator bucket at center below blue reflective safety vest at center?" }, { "from": "gpt", "value": "Incorrect, rusty metal excavator bucket at center is not positioned below blue reflective safety vest at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/52b832335dd50a4c.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.502, 0.809) come farther from viewer compared to point (0.274, 0.747)?" }, { "from": "gpt", "value": "No, (0.502, 0.809) is in front of (0.274, 0.747)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0547f47f80556296.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of rusty wood door at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.510, 0.230)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/780f9082d25a6c2a.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.791, 0.559) less distant than point (0.079, 0.555)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04af94805b4b0503.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked as point (0.505, 0.173) in the image, which is in a rural forest area. You want to walk towards the pickup truck parked on the right side of the road. Which direction should you head to reach the pickup truck?" }, { "from": "gpt", "value": "The point (0.505, 0.173) corresponds to the green leafy tree at upper center. To reach the pickup truck parked on the right side of the road, you should head downwards from the green leafy tree at upper center towards the lower right direction." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a1aa4b219775490f.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.300, 0.847) positioned after point (0.953, 0.484)?" }, { "from": "gpt", "value": "No, (0.300, 0.847) is in front of (0.953, 0.484)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5db088d151c30b42.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of green leafy tree at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.116, 0.253)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b8992bce34ccc48f.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the scene of a protest. You want to capture a closeup shot of the white crumpled paper at center without including the signs in the background. Given that your camera has a focal length of 50mm and you need to maintain a depth of field that blurs the background, how far should you position yourself from the paper to achieve this effect?" }, { "from": "gpt", "value": "To blur the background signs while focusing on the white crumpled paper at center, you should position yourself approximately 5.15 feet away from the paper, as it is the optimal distance for your camera settings to achieve the desired depth of field." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f34d611291eefee.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from brown dirt track at center to camera." }, { "from": "gpt", "value": "brown dirt track at center is 8.33 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/84ed7e3e110abd5d.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.867, 0.531) come closer to viewer compared to point (0.952, 0.900)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/19dba4647b298880.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the green leafy shrub at lower right and want to reach the green leafy trees at center. How far is the distance between them?" }, { "from": "gpt", "value": "The distance between the green leafy shrub at lower right and the green leafy trees at center is 91.33 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd1fe843f1f17f3a.jpg", "conversations": [ { "from": "human", "value": "\nLocate white matte projection screen at upper center in the image." }, { "from": "gpt", "value": "[(0.732, 0.322)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd949a94e5c52537.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green metal fence at left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.129, 0.434)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c0ca51557e03a70a.jpg", "conversations": [ { "from": "human", "value": "\nWhere is plaid flannel shirt at lower right located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.843, 0.919)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7c6014879bca2006.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is black glossy monitor at center from white matte keyboard at center?" }, { "from": "gpt", "value": "black glossy monitor at center is 27.50 centimeters from white matte keyboard at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a41191cf29a6f6cc.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.805, 0.352)?" }, { "from": "gpt", "value": "black matte hand at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4010fddbac91c1f.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.958, 0.522) or (0.581, 0.142)?" }, { "from": "gpt", "value": "The point (0.581, 0.142) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eda4bcf47faf1d5f.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.652, 0.738) and point (0.775, 0.816), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.652, 0.738) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb94dcc7b23fd2b8.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth reflective water at lower center wider than dark gray concrete people at lower center?" }, { "from": "gpt", "value": "Yes, smooth reflective water at lower center is wider than dark gray concrete people at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0693bbc8777e099.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to pink cotton shirt at center? Please provide its 2D coordinates.Where can I find pink cotton shirt at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.858, 0.673)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/64e9167208cf8db5.jpg", "conversations": [ { "from": "human", "value": "\nHow far is point (0.947, 0.145) from the camera?" }, { "from": "gpt", "value": "A distance of 4.33 feet exists between point (0.947, 0.145) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5666c97b4e3a4f7e.jpg", "conversations": [ { "from": "human", "value": "\nDoes shiny metallic armor at center appear over black leather armor at center?" }, { "from": "gpt", "value": "Incorrect, shiny metallic armor at center is not positioned above black leather armor at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bfc4c8ff9e0ed4a6.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the glasses is positioned at the coordinates point (0.488, 0.742)?" }, { "from": "gpt", "value": "The matte plastic glasses at center is located at point (0.488, 0.742)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4579ecaab260c0d1.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between stone church at center and gray stone tower at upper center." }, { "from": "gpt", "value": "A distance of 9.88 meters exists between stone church at center and gray stone tower at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9dc053c2adc518e6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if light blue cotton shirt at center is thinner than beige plaid shirt at center?" }, { "from": "gpt", "value": "Correct, light blue cotton shirt at center's width is less than beige plaid shirt at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f4dee087dbe9c8b.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between point (0.972, 0.652) and camera." }, { "from": "gpt", "value": "Point (0.972, 0.652) and camera are 8.17 feet apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/784573f08e3ccad4.jpg", "conversations": [ { "from": "human", "value": "\nDoes shiny red jacket at center appear over white sweater at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b2e9cca4c9708068.jpg", "conversations": [ { "from": "human", "value": "\nYou are an event planner organizing a military ceremony. You need to ensure that the black smooth suit at center and the dark blue fabric flag at center are positioned appropriately. Based on their sizes, which object should be placed on the left side to ensure proper alignment?" }, { "from": "gpt", "value": "The black smooth suit at center has a lesser width compared to the dark blue fabric flag at center. To ensure proper alignment, the narrower black smooth suit at center should be placed on the left side so that the wider dark blue fabric flag at center can be positioned to its right, maintaining balance in the arrangement." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d8809227533699d4.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of yellow-green fabric flag at upper center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.735, 0.344)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f36818133cd2dad.jpg", "conversations": [ { "from": "human", "value": "\nDoes white shirt at center have a lesser height compared to matte white shirt at center?" }, { "from": "gpt", "value": "No, white shirt at center is not shorter than matte white shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/64faeec92e159bc9.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if velvety blue blanket at center is positioned to the left of shiny black cat at center?" }, { "from": "gpt", "value": "Correct, you'll find velvety blue blanket at center to the left of shiny black cat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/461a773cddb512ee.jpg", "conversations": [ { "from": "human", "value": "\nIs glassy white tower at center in front of green leafy tree at right?" }, { "from": "gpt", "value": "No, glassy white tower at center is further to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2cd439988cf7e1f0.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.262, 0.952) less distant than point (0.585, 0.562)?" }, { "from": "gpt", "value": "Yes, point (0.262, 0.952) is in front of point (0.585, 0.562)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7e20795613d567d.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of bright yellow starburst at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.597, 0.044)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9708ff1cdb33f87a.jpg", "conversations": [ { "from": "human", "value": "\nYou are a gardener planning to mow the lawn around the dark gray asphalt path at lower center and the brown wooden cabin at center. Which area requires a wider mower path?" }, { "from": "gpt", "value": "The dark gray asphalt path at lower center might require a wider mower path since it is possibly wider than the brown wooden cabin at center according to the description." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5825e6ae1212e152.jpg", "conversations": [ { "from": "human", "value": "\nDoes transparent plastic bottle at center-right have a lesser height compared to clear plastic bottle at upper center?" }, { "from": "gpt", "value": "Yes, transparent plastic bottle at center-right is shorter than clear plastic bottle at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7118c64b9d30c52a.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between point (0.795, 0.273) and camera." }, { "from": "gpt", "value": "Point (0.795, 0.273) is 4.85 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00a20986a3abbd4c.jpg", "conversations": [ { "from": "human", "value": "\nHow close is blue enamel kettle at upper left from wooden-handled metal spatula at lower center?" }, { "from": "gpt", "value": "blue enamel kettle at upper left is 2.85 inches away from wooden-handled metal spatula at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/731f034931fbef06.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the keyboard and want to place a small cup of water exactly at the point marked as point (0.514, 0.506). If the cup is 0.3 meters in diameter, will it fit without overlapping other objects?" }, { "from": "gpt", "value": "The point (0.514, 0.506) is 1.66 meters away from the camera. Since the cup is only 0.3 meters in diameter, it should fit at that position without overlapping other objects as long as there is enough space on the keyboard or nearby area. However, the description does not provide information about nearby objects at that specific location." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4e4a57a0aa33335b.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.297, 0.341) and point (0.927, 0.452), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.297, 0.341)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/745c4bb1ba358566.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.835, 0.856) or (0.757, 0.883)?" }, { "from": "gpt", "value": "Point (0.757, 0.883)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/20af7dab653a4560.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.579, 0.577) farther from camera compared to point (0.696, 0.988)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/877759925344c493.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the soccer match and want to capture a photo that includes both the multicolored fabric crowd at upper center and the dark blue jersey at lower right. Which object will appear larger in the photo?" }, { "from": "gpt", "value": "The multicolored fabric crowd at upper center will appear larger in the photo because it is much taller than the dark blue jersey at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3326a4cf662d25ee.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the black embroidered shirt at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.787, 0.689)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e36d32910ecbd769.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the airport terminal and want to reach a specific point marked as point (0.667, 0.528). How far is this point from your current position?" }, { "from": "gpt", "value": "The distance of point (0.667, 0.528) from viewer is 110.97 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/227a577db55e36ab.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of green leafy tree at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.496, 0.173)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/146b7934739258cd.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker who just arrived at the path. You see the dirt track at center and the brown and white fur at center. Which one is closer to the ground?" }, { "from": "gpt", "value": "The dirt track at center is positioned under brown and white fur at center, so the dirt track at center is closer to the ground." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b10d34ebc4e4634f.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is dark brown curly hair at upper left from camera?" }, { "from": "gpt", "value": "dark brown curly hair at upper left and camera are 32.85 inches apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23a2c864941a5338.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, white fabric headscarf at center or dark gray fabric dress at center right?" }, { "from": "gpt", "value": "Positioned lower is white fabric headscarf at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a51d84d49b8da2f3.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of clear water at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.740, 0.681)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/851b79412488cf21.jpg", "conversations": [ { "from": "human", "value": "\nBetween metallic chrome motorcycle at center and rubber/textured tire at lower center, which one is positioned higher?" }, { "from": "gpt", "value": "metallic chrome motorcycle at center is higher up." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc6c622722b64bb8.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.022, 0.994) and camera." }, { "from": "gpt", "value": "21.15 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab6e28d626ec1697.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing a Halloween display and need to place a new pumpkin between the two existing pumpkins on the table. The new pumpkin must be placed to the right of the matte orange pumpkin at left but to the left of the matte orange pumpkin at center. Is this possible given their current positions?" }, { "from": "gpt", "value": "The matte orange pumpkin at center is positioned on the right side of the matte orange pumpkin at left, so there is no space between them for the new pumpkin. Therefore, it is not possible to place the new pumpkin in the specified position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c888d508d6393b87.jpg", "conversations": [ { "from": "human", "value": "\nIs silhouette leafless tree at left positioned before silhouette bare branches at upper left?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8229b99c52a2f47f.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.976, 0.541) farther from viewer compared to point (0.063, 0.364)?" }, { "from": "gpt", "value": "No, (0.976, 0.541) is in front of (0.063, 0.364)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2a8d7e1a6e6a3d92.jpg", "conversations": [ { "from": "human", "value": "\nHow far is green striped shirt at center from camera?" }, { "from": "gpt", "value": "green striped shirt at center is 16.01 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8bd118c23f1a77d.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the riverside. You want to take a photo of the blonde hair at left and the matte red shirt at center so that both are in frame. Given that your camera has a focal length of 50mm and the minimum focusing distance is 1 meter, can you capture both subjects in the same shot without moving?" }, { "from": "gpt", "value": "The distance between the blonde hair at left and the matte red shirt at center is 5.91 meters. Since the minimum focusing distance is 1 meter, the photographer can capture both subjects in the same shot as long as they position themselves within 1 meter of the closest subject, ensuring both are within the camera range." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/71051b586e2559b8.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between point (0.030, 0.102) and camera?" }, { "from": "gpt", "value": "Point (0.030, 0.102) is 21.19 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d8b648a97b80734.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.845, 0.412) or (0.953, 0.411)?" }, { "from": "gpt", "value": "The point (0.953, 0.411) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8458f0cf9754977c.jpg", "conversations": [ { "from": "human", "value": "\nLocate the red sheer dupatta at center in the image." }, { "from": "gpt", "value": "[(0.788, 0.517)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a98773fd60f96669.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the boat and want to take a photo of the person wearing the floral dress at center. Where should you look to find them?" }, { "from": "gpt", "value": "The floral dress at center is located at point (0.576, 0.817)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/72ad6484b839e554.jpg", "conversations": [ { "from": "human", "value": "\nYou are a contractor assessing the kitchen area. You need to place a new appliance that requires 1.2 meters of space. The appliance is as wide as the black matte stove at lower left. Can the white glossy countertop at lower left accommodate it?" }, { "from": "gpt", "value": "The white glossy countertop at lower left is larger in size than the black matte stove at lower left. Since the appliance is as wide as the stove, and the countertop is larger, it can accommodate the appliance." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2558723ab6cfdb8c.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of black plastic laptop at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.685, 0.673)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec83fed5ec7d3620.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.454, 0.828) farther from camera compared to point (0.774, 0.764)?" }, { "from": "gpt", "value": "Yes, point (0.454, 0.828) is behind point (0.774, 0.764)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0c30a14701a06a2b.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, green leafy tree at left or bare branches at upper right, stands taller?" }, { "from": "gpt", "value": "bare branches at upper right is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4800cf990ebd8100.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.378, 0.703) or (0.294, 0.428)?" }, { "from": "gpt", "value": "Point (0.294, 0.428)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7f4adffe5dc18064.jpg", "conversations": [ { "from": "human", "value": "\nHow far is point (0.581, 0.825) from the camera?" }, { "from": "gpt", "value": "Point (0.581, 0.825) is 5.93 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e81fac236acc4110.jpg", "conversations": [ { "from": "human", "value": "\nYou are a pedestrian standing on the street and see the black glass traffic light at upper center and the dark blue jeans at center. Which object is taller?" }, { "from": "gpt", "value": "The black glass traffic light at upper center is taller than the dark blue jeans at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/922eae7dcf6f96ee.jpg", "conversations": [ { "from": "human", "value": "\nYou are a patient in the veterinary clinic and you see the light blue fabric shirt at center and the white plastic cone at center. Which object is closer to the left side of the scene?" }, { "from": "gpt", "value": "The light blue fabric shirt at center is closer to the left side of the scene because it is positioned to the left of the white plastic cone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e1c4a2be518a911.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray suit at center lie behind blonde hair at upper left?" }, { "from": "gpt", "value": "Yes, it is behind blonde hair at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/afbbb0b23f8b4cb7.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.379, 0.673) or (0.777, 0.652)?" }, { "from": "gpt", "value": "Point (0.379, 0.673) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86635714bd0ff858.jpg", "conversations": [ { "from": "human", "value": "\nYou are a wildlife photographer aiming to capture both the brown speckled duck at left and the brown speckled duck at center in a single frame. Based on their positions, which duck is positioned closer to the edge of the frame?" }, { "from": "gpt", "value": "The brown speckled duck at left is closer to the edge of the frame since it is positioned at the left side, while the brown speckled duck at center is in the middle." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7c3ecdede60435f3.jpg", "conversations": [ { "from": "human", "value": "\nLocate the black rubber road at center in the image." }, { "from": "gpt", "value": "[(0.495, 0.811)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/51490ea4079c9a05.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the cyclist in the scene. You want to ensure both the shiny metallic bicycle at center and the neon green jersey at center are clearly visible in your photo. Given their positions, which object should you focus on to ensure both are in sharp focus?" }, { "from": "gpt", "value": "The neon green jersey at center is behind the shiny metallic bicycle at center. To ensure both are in sharp focus, you should focus on the shiny metallic bicycle at center since it is closer to the camera, and the neon green jersey at center will be in focus as it is behind it within the depth of field." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dfe810791f761a64.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.551, 0.914) or point (0.322, 0.825)?" }, { "from": "gpt", "value": "Point (0.551, 0.914) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4cabd677446f65f1.jpg", "conversations": [ { "from": "human", "value": "\nDoes orange cotton shirt at center have a lesser width compared to orange fabric shirt at center?" }, { "from": "gpt", "value": "Incorrect, orange cotton shirt at center's width is not less than orange fabric shirt at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a3ddfa526481268a.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the white fabric shirt at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.792, 0.255)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df1b0af7606fc776.jpg", "conversations": [ { "from": "human", "value": "\nLocate all clear water at center in the image." }, { "from": "gpt", "value": "[(0.760, 0.386)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/041ea14f4e8eff69.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.952, 0.080) or (0.370, 0.305)?" }, { "from": "gpt", "value": "Positioned in front is point (0.952, 0.080)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3bf0f56934188c12.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, glassy brown building at center or green leafy tree at center?" }, { "from": "gpt", "value": "glassy brown building at center is above." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e7641e4853a8108.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the matte black shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.480, 0.478)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0043ad4792ec271c.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the brick wall at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.539, 0.450)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dced86f2ee7abab7.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.567, 0.845) or (0.042, 0.388)?" }, { "from": "gpt", "value": "The point (0.042, 0.388) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/022f0e965abe271a.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the reflective safety vest at left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.085, 0.727)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e3b1eae35640afc.jpg", "conversations": [ { "from": "human", "value": "\nIs matte blue fabric at center to the left of shiny gold crown at lower right from the viewer's perspective?" }, { "from": "gpt", "value": "Correct, you'll find matte blue fabric at center to the left of shiny gold crown at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bca467f067a74c4d.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.607, 0.666) or (0.926, 0.834)?" }, { "from": "gpt", "value": "Point (0.607, 0.666) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e726f7cc1554a54.jpg", "conversations": [ { "from": "human", "value": "\nBetween purple cotton t-shirt at center and light brown hair at center, which one is positioned higher?" }, { "from": "gpt", "value": "light brown hair at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d69ec5f22cd0948.jpg", "conversations": [ { "from": "human", "value": "\nYou are an artist setting up your workspace. You have a matte black pencil at center and a black leather shoe at lower left in your view. Which object is positioned higher in the image?" }, { "from": "gpt", "value": "The matte black pencil at center is positioned higher than the black leather shoe at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2808f75b5fde4a81.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the yellow leather jacket at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.666, 0.725)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b6f10c71c9a2ae19.jpg", "conversations": [ { "from": "human", "value": "\nIs brown leather jacket at center wider than brown leather jacket at right?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a6269f9d400aa6c3.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black plastic tray at center is thinner than transparent glass wine glass at upper left?" }, { "from": "gpt", "value": "No, black plastic tray at center is not thinner than transparent glass wine glass at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/57bad483b5680124.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown grassy terrain at center have a greater height compared to red fleece sweater at right?" }, { "from": "gpt", "value": "No, brown grassy terrain at center is not taller than red fleece sweater at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ee59708bf7052336.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.193, 0.358) come farther from viewer compared to point (0.084, 0.734)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/72f1b8eadf01a934.jpg", "conversations": [ { "from": "human", "value": "\nIs gray matte t-shirt at center wider than orange cotton t-shirt at left?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4d15b8c665c9ae96.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.009, 0.111) more distant than point (0.304, 0.822)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/267f30e873cdae4f.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, polished silver wheel at lower right or dark gray fabric at lower left?" }, { "from": "gpt", "value": "dark gray fabric at lower left is above." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6d6c834d7aec9b7.jpg", "conversations": [ { "from": "human", "value": "\nBetween green leafy tree at left and clear water at lake left, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "green leafy tree at left is more to the right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77c84c4c7182f040.jpg", "conversations": [ { "from": "human", "value": "\nYou are a guest at the birthday party and want to place a small gift between the chocolatesmoothcake at center and the matte clay piglet at center. Based on their positions, where should you place the gift?" }, { "from": "gpt", "value": "The chocolatesmoothcake at center is positioned on the left side of matte clay piglet at center, so you should place the gift between them to the right of the chocolatesmoothcake at center and to the left of the matte clay piglet at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70e489d9c490f3ce.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the scene from the balcony. You notice the matte gray shirt at center and the matte black sunglasses at center. Which object is positioned lower in the image?" }, { "from": "gpt", "value": "The matte gray shirt at center is below matte black sunglasses at center, so the matte gray shirt at center is positioned lower in the image." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b2fac488fbc3b9c0.jpg", "conversations": [ { "from": "human", "value": "\nDoes striped fabric tie at center appear on the right side of green fabric chair at center?" }, { "from": "gpt", "value": "Incorrect, striped fabric tie at center is not on the right side of green fabric chair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bef83f8e80b67065.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the living room and want to place a small decorative item between the two points, point (0.640, 0.858) and point (0.411, 0.953). Based on their positions, which point should the item be closer to in order to be centered between them?" }, { "from": "gpt", "value": "To center the decorative item between point (0.640, 0.858) and point (0.411, 0.953), it should be placed closer to point (0.411, 0.953) since point (0.640, 0.858) is in front of it, meaning the distance between them requires the item to balance their positions." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/495cfb011fded23b.jpg", "conversations": [ { "from": "human", "value": "\nLocate the gray cotton shirt at center in the image." }, { "from": "gpt", "value": "[(0.450, 0.494)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/002f2d008de2f535.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker who has just finished a long walk and needs to retrieve your jacket. You see the shiny blue bicycle at right and the dark blue jacket at center. Which object is closer to you?" }, { "from": "gpt", "value": "The dark blue jacket at center is closer to you because it is located at the center of the scene, while the shiny blue bicycle at right is positioned further away on the right side. According to the description, they are 27.20 meters apart, so the jacket is nearer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60155fa0ef52295a.jpg", "conversations": [ { "from": "human", "value": "\nIs matte gray t-shirt at center above white cotton shirt at center?" }, { "from": "gpt", "value": "Indeed, matte gray t-shirt at center is positioned over white cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a77cee90a67aaf47.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.586, 0.398) or (0.340, 0.147)?" }, { "from": "gpt", "value": "The point (0.586, 0.398) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d09bbb20f24a41d.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the baby and the toys on the blanket. Since the plaid fabric blanket at center and the rubberized plastic toy at center are in the frame, which object will appear larger in your photo?" }, { "from": "gpt", "value": "The plaid fabric blanket at center will appear larger in the photo since it is taller than the rubberized plastic toy at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a64a97a416bb573.jpg", "conversations": [ { "from": "human", "value": "\nDoes clear blue water at center come in front of white glossy boat at center?" }, { "from": "gpt", "value": "Yes, it is in front of white glossy boat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4230fe3e1773f9ac.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer positioned at the back of the venue. You want to capture a photo of both the printed cotton shirt at center and the wooden acoustic guitar at center in the same frame. Based on their positions, which object should you focus on first to ensure both are in the frame?" }, { "from": "gpt", "value": "The printed cotton shirt at center is to the left of the wooden acoustic guitar at center, so you should focus on the wooden acoustic guitar at center first to ensure both are in the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd84c1a6b762e02e.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any orange fabric bandana at center in the image." }, { "from": "gpt", "value": "[(0.581, 0.428)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ddeb26053061e37.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of marble column at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.676, 0.556)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e1b489950b015aa.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if striped shirt at lower left is positioned to the right of wooden table at center?" }, { "from": "gpt", "value": "Incorrect, striped shirt at lower left is not on the right side of wooden table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e18cb9ff3b259b77.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.197, 0.955) come farther from viewer compared to point (0.859, 0.539)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/53add9674dc6d7d6.jpg", "conversations": [ { "from": "human", "value": "\nBased on the coordinates provided, which object is located at point (0.149, 0.636) in the image?" }, { "from": "gpt", "value": "The point (0.149, 0.636) indicates the white knit sweater at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c92d42607581a96.jpg", "conversations": [ { "from": "human", "value": "\nHow much distance is there between dark blue leather jacket at center and smooth asphalt train track at right?" }, { "from": "gpt", "value": "dark blue leather jacket at center is 3.46 meters from smooth asphalt train track at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c5dbc8c465f8c4d7.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the gray concrete beams at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.709, 0.492)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0fb91bd32b39649d.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.197, 0.783) or point (0.016, 0.589)?" }, { "from": "gpt", "value": "Point (0.016, 0.589)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8ca1ed365780a7a8.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the dinosaur statue and notice a specific point marked at coordinates (0.489, 0.300). Based on the scene description, where is this point located relative to the dinosaur statue?" }, { "from": "gpt", "value": "The point at coordinates (0.489, 0.300) is located on green leafy plants at center, which are part of the lush green environment surrounding the dinosaur statue." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4301dff5fae04e27.jpg", "conversations": [ { "from": "human", "value": "\nHow far is green grassy pasture at center from camera?" }, { "from": "gpt", "value": "green grassy pasture at center and camera are 6.16 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b46881cff2d3393.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of maroon matte sign at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.562, 0.241)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7718159d1266e7de.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.585, 0.473)?" }, { "from": "gpt", "value": "teal fabric necklace at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/31e7cd4f5a7187e6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white feathered duck at center is wider than white feathered goose at center?" }, { "from": "gpt", "value": "Incorrect, white feathered duck at center's width does not surpass white feathered goose at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b812c0b8de81dafa.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the soccer stadium. You want to take a photo of the smooth bald head at lower right and the gray cotton shirt at lower center. Which of the two objects should you focus on if you want to capture the wider one in your shot?" }, { "from": "gpt", "value": "The smooth bald head at lower right is wider than the gray cotton shirt at lower center, so you should focus on the smooth bald head at lower right to capture the wider one." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4ea4e1e12b3f2a41.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of pink blossoms at center from camera?" }, { "from": "gpt", "value": "pink blossoms at center is 65.79 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e030cf9126136ec7.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of shiny green tree at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.703, 0.439)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc8b7034e237efca.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between plaid shirt at center and plaid cotton shirt at left?" }, { "from": "gpt", "value": "plaid shirt at center is 1.81 inches from plaid cotton shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f80656c93055af7.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the plaid fabric skirt at lower left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.180, 0.656)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9e3b86e9b5aac44.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.561, 0.466) or (0.857, 0.500)?" }, { "from": "gpt", "value": "The point (0.857, 0.500) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08d014c6a1a104f2.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer capturing the fishing scene. You want to ensure the shiny silver fish at center and the smooth black rod at center are both visible in your shot. Based on their positions, which object should you focus on first to capture both in the frame?" }, { "from": "gpt", "value": "The shiny silver fish at center is located below the smooth black rod at center. To capture both in the frame, focus on the smooth black rod at center first, as it is above the fish, ensuring the fish remains within the lower part of the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff622fde4dc1e422.jpg", "conversations": [ { "from": "human", "value": "\nIs glossy red tomato at center behind white fabric shirt at upper center?" }, { "from": "gpt", "value": "No, it is in front of white fabric shirt at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08edd7d6d41ac47e.jpg", "conversations": [ { "from": "human", "value": "\nYou are a soccer referee observing the match. You notice two players, the white striped jersey at center and the blue jersey at center, are both reaching for the soccer ball. Which player is closer to the ball?" }, { "from": "gpt", "value": "The white striped jersey at center is positioned on the left side of the blue jersey at center. Since the ball is above the goalkeeper, it is likely closer to the blue jersey at center, which is positioned closer to the ball." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d89437fa27d0bb4.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and want to know how far the point at coordinates point (0.404, 0.503) is from you. What is the distance in meters?" }, { "from": "gpt", "value": "The distance of point (0.404, 0.503) from camera is 44.62 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7a47e30843db1d27.jpg", "conversations": [ { "from": "human", "value": "\nIs translucent glass bowl at upper right to the right of white crumbly meatball at center from the viewer's perspective?" }, { "from": "gpt", "value": "Yes, translucent glass bowl at upper right is to the right of white crumbly meatball at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/62e0088bd6cca21a.jpg", "conversations": [ { "from": "human", "value": "\nWhat is at (0.880, 0.502)?" }, { "from": "gpt", "value": "white marble pillar at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/039b28864e40f550.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, maroon fabric bunk bed at center or brown wood dresser at lower right, stands taller?" }, { "from": "gpt", "value": "maroon fabric bunk bed at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/72f0e83cf2d3adfd.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a white wooden clock at center. Pinpoint a point to the white wooden clock at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.512, 0.302)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7c3f16a418d5ade.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the black leather scarf at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.610, 0.702)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c4f9056050e9aed.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the green leafy tree at upper left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.396, 0.183)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc5e8359224931cc.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between point (0.036, 0.958) and camera?" }, { "from": "gpt", "value": "Point (0.036, 0.958) and camera are 13.72 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5731d3a54ff5ff4.jpg", "conversations": [ { "from": "human", "value": "\nHow close is point (0.769, 0.489) from camera?" }, { "from": "gpt", "value": "The distance of point (0.769, 0.489) from camera is 9.75 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab9a4553eda98e7b.jpg", "conversations": [ { "from": "human", "value": "\nIs camouflage uniform at center further to the viewer compared to white matte tank top at center?" }, { "from": "gpt", "value": "No, camouflage uniform at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/39c38e1194b3af2c.jpg", "conversations": [ { "from": "human", "value": "\nIs natural wood structure at center to the right of green mossy water at lower center from the viewer's perspective?" }, { "from": "gpt", "value": "In fact, natural wood structure at center is to the left of green mossy water at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c6f89fd36b9a9a0.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, white timber-framed building at center or textured fabric clothes at lower right?" }, { "from": "gpt", "value": "white timber-framed building at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e1207022dffe8a4.jpg", "conversations": [ { "from": "human", "value": "\nBased on the scene description, where is the white cotton shirt at center located in terms of its 2D coordinates?" }, { "from": "gpt", "value": "The white cotton shirt at center is located at the 2D coordinates point (0.722, 0.647)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0bdc93697fac1075.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.118, 0.731) from camera?" }, { "from": "gpt", "value": "Point (0.118, 0.731) is 7.31 feet away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/12d28eb9432da8f3.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, gray cotton t-shirt at right or knitted sweater at center?" }, { "from": "gpt", "value": "gray cotton t-shirt at right is above." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc78821c1dcdfc32.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the center of the image. Which direction should you move to get closer to the green leafy tree at center?" }, { "from": "gpt", "value": "Since the green leafy tree at center is located at point coordinates of (0.542, 0.217), you should move to the left to get closer to it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/130c2881d854e385.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black suit at center positioned at the back of red silk tie at left?" }, { "from": "gpt", "value": "Yes, it is behind red silk tie at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4ef8b48e871d900.jpg", "conversations": [ { "from": "human", "value": "\nHow far is point (0.281, 0.609) from the camera?" }, { "from": "gpt", "value": "Point (0.281, 0.609) is 12.19 feet from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b67b77b22f45644.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at an event and need to capture a photo of the black pinstripe suit at center and the tan fabric suit at right. Which of the two suits should you focus on first if you want to highlight the larger one in your composition?" }, { "from": "gpt", "value": "The black pinstripe suit at center is bigger than the tan fabric suit at right, so you should focus on the black pinstripe suit at center first to highlight its larger size in the composition." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f1c7729f35591a3.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.646, 0.595) come farther from viewer compared to point (0.923, 0.031)?" }, { "from": "gpt", "value": "Yes, point (0.646, 0.595) is farther from viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ac8a86feb8458b2f.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the white paper at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.761, 0.720)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7a00f0e6e0fc5007.jpg", "conversations": [ { "from": "human", "value": "\nLocate green mossy canoe at lower center in the image." }, { "from": "gpt", "value": "[(0.791, 0.203)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5fd5f7175158eff7.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.782, 0.861) in front of point (0.061, 0.445)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08fd0d045d49ee8e.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.180, 0.609) positioned behind point (0.963, 0.753)?" }, { "from": "gpt", "value": "Yes, it is behind point (0.963, 0.753)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff91bd45ec0a841a.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown glossy horse at right appear under black and white fluffy dog at left?" }, { "from": "gpt", "value": "No, brown glossy horse at right is not below black and white fluffy dog at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/424fb1820f5aeb9f.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth concrete sidewalk at center taller than shiny black leather jacket at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/667faec950cbbc6a.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the black matte hoodie at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.139, 0.603)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4851ea652f86a54.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, concrete stairs at center or dark green jacket at center?" }, { "from": "gpt", "value": "dark green jacket at center is higher up." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7b8acf3315c0c53.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.090, 0.633) or point (0.119, 0.573)?" }, { "from": "gpt", "value": "Positioned in front is point (0.090, 0.633)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c1ca1ee0743c4eb.jpg", "conversations": [ { "from": "human", "value": "\nIs matte yellow shirt at center to the right of khaki uniform shirt at center from the viewer's perspective?" }, { "from": "gpt", "value": "Incorrect, matte yellow shirt at center is not on the right side of khaki uniform shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/53aa24161223dd05.jpg", "conversations": [ { "from": "human", "value": "\nBetween brown leafy tree at center and bare branches at left, which one is positioned higher?" }, { "from": "gpt", "value": "Positioned higher is bare branches at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/93f12ca9ef40f404.jpg", "conversations": [ { "from": "human", "value": "\nIs brown matte dog at center thinner than pink glossy tongue at center?" }, { "from": "gpt", "value": "Incorrect, brown matte dog at center's width is not less than pink glossy tongue at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/52edd0ac361189fd.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the floral dress at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.462, 0.212)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d549462f8e7fcfc6.jpg", "conversations": [ { "from": "human", "value": "\nYou are a tourist in Venice and see the brown brick tower at center and the matte blue shirt at center. Which object is higher in the image?" }, { "from": "gpt", "value": "The brown brick tower at center is located above the matte blue shirt at center, so it is higher in the image." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44553a4e8d18baca.jpg", "conversations": [ { "from": "human", "value": "\nLocate all beige stone palace at center in the image." }, { "from": "gpt", "value": "[(0.669, 0.606)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf546d37ad2b073e.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.738, 0.672) behind point (0.210, 0.094)?" }, { "from": "gpt", "value": "Yes, point (0.738, 0.672) is behind point (0.210, 0.094)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab7bbfb85443657d.jpg", "conversations": [ { "from": "human", "value": "\nHow close is white smooth shirt at center from white shirt at center?" }, { "from": "gpt", "value": "white smooth shirt at center and white shirt at center are 1.39 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/20fd752f9e76d018.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.275, 0.486) positioned in front of point (0.250, 0.809)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed8a89e2fe0c84b5.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing in front of the cactus scene. You want to take a photo focusing on the fuzzy brown cactus at center without the green fuzzy cactus at lower left appearing too prominent in the background. Based on their positions, can you suggest whether you should zoom in or zoom out?" }, { "from": "gpt", "value": "The fuzzy brown cactus at center is closer to the viewer than the green fuzzy cactus at lower left. To minimize the prominence of the green fuzzy cactus at lower left in the background, you should zoom in on the fuzzy brown cactus at center. This will narrow the field of view, making the background elements smaller and less noticeable." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1661b5dae1336840.jpg", "conversations": [ { "from": "human", "value": "\nPoint to matte black jacket at center.Point to the matte black jacket at center in the image." }, { "from": "gpt", "value": "[(0.562, 0.566)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b86eb9a4cfbe588.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the distance between green leafy tree at center and brown sedimentary water at center?" }, { "from": "gpt", "value": "The distance of green leafy tree at center from brown sedimentary water at center is 17.66 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bedba3792de75265.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the blue water at lower center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.487, 0.863)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02c0e934716162dd.jpg", "conversations": [ { "from": "human", "value": "\nDoes green grass at center have a greater height compared to white glossy sedan at lower left?" }, { "from": "gpt", "value": "Correct, green grass at center is much taller as white glossy sedan at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4e5c859bc289bd30.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between blue tarpaulin boat at center and camera?" }, { "from": "gpt", "value": "24.00 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4ac182d86f402910.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of matte black vinyl records at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.881, 0.333)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5a4c388d7ceb754.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the field and want to place a small flag at the point that is closer to you. Which point should you choose between point (0.999, 0.891) and point (0.810, 0.558)?" }, { "from": "gpt", "value": "You should choose point (0.999, 0.891) because it is closer to the camera than point (0.810, 0.558)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e9acfea2f9a9795f.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a brown earthy landscape at center. Pinpoint a point to the brown earthy landscape at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.458, 0.716)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95df83731e3c61a0.jpg", "conversations": [ { "from": "human", "value": "\nLocate all smooth black suit at center in the image." }, { "from": "gpt", "value": "[(0.494, 0.341)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/205ae4bb33f92f64.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the historic stone building and want to place a 2.5 meter tall statue on the stone ledge at upper center. Can the statue fit on the ledge?" }, { "from": "gpt", "value": "The stone ledge at upper center and viewer are 6.15 meters apart, but this distance does not indicate the ledge size. The question cannot be answered with the given information." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92789317888a15ee.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, rope swing at center or matte red shorts at center?" }, { "from": "gpt", "value": "matte red shorts at center is below." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7a6774cb5c2c0552.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if red matte shirt at center is thinner than yellow fabric at center?" }, { "from": "gpt", "value": "No, red matte shirt at center is not thinner than yellow fabric at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8cf3e4d12bbb3a5.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the right, green leafy tree at center-right or green leafy tree at upper center?" }, { "from": "gpt", "value": "green leafy tree at center-right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f616b389c4354f0.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing in the hallway and want to take a photo of both the purple satin dress at center and the yellow matte shirt at center. Which one should you focus on first to ensure both are in clear focus?" }, { "from": "gpt", "value": "The purple satin dress at center is closer to the viewer than the yellow matte shirt at center, so you should focus on the purple satin dress at center first to ensure both are in clear focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e495271b213aa4c.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of whiteboard at upper center more distant than that of white paper list at center?" }, { "from": "gpt", "value": "No, whiteboard at upper center is in front of white paper list at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92fd67bb298ce448.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between black matte tennis racket at center and camera?" }, { "from": "gpt", "value": "black matte tennis racket at center and camera are 27.98 feet apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/982c1cc6812ad196.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green textured dress at center is taller than matte black shirt at center?" }, { "from": "gpt", "value": "Incorrect, green textured dress at center's height is not larger of matte black shirt at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/57f8e7631c19725a.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between shiny black jacket at center and smooth black suit at upper right?" }, { "from": "gpt", "value": "30.20 inches" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d01452ee79db1b60.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the yellow matte helmet at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.658, 0.519)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e928a49ee8b85d8e.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person who needs to load a large package onto the white metallic ramp at center. The package is as big as the matte black bus at center. Can the ramp handle the size of the package?" }, { "from": "gpt", "value": "The matte black bus at center is bigger than the white metallic ramp at center, so the ramp cannot handle the size of the package since it is smaller than the bus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a75edc918bac00e.jpg", "conversations": [ { "from": "human", "value": "\nBetween green grassy at center and clear blue water at left, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "Positioned to the left is clear blue water at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/22e4f00a00c219ef.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.889, 0.564) come behind point (0.971, 0.678)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf10d1140222aa5b.jpg", "conversations": [ { "from": "human", "value": "\nWhere is black matte blazer at left located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.163, 0.672)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a37193d62ad1e84.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between point (0.483, 0.559) and camera." }, { "from": "gpt", "value": "Point (0.483, 0.559) is 7.29 feet from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/69d7d241c70f9434.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if red fabric jacket at center is smaller than black paper at left?" }, { "from": "gpt", "value": "Incorrect, red fabric jacket at center is not smaller in size than black paper at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d607c7120d6cdbcd.jpg", "conversations": [ { "from": "human", "value": "\nIs asphalt at center above yellow matte motorcycle at left?" }, { "from": "gpt", "value": "Incorrect, asphalt at center is not positioned above yellow matte motorcycle at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b54e1cee34ef896d.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, floral fabric blouse at center or pink fabric shirt at center, stands shorter?" }, { "from": "gpt", "value": "With less height is pink fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6102a42c73efcb6b.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the wooden framed artwork at upper left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.120, 0.144)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/645f38c8a5f422b0.jpg", "conversations": [ { "from": "human", "value": "\nPoint to metallic gray garage door at left.Point to the metallic gray garage door at left in the image." }, { "from": "gpt", "value": "[(0.074, 0.653)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4419da41eff305e2.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and want to walk to the smooth sand at lower center. How far do you need to walk?" }, { "from": "gpt", "value": "The smooth sand at lower center is 4.62 meters away from the camera, so you need to walk 4.62 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/da7d1974f474496d.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing a networking event and need to retrieve a bag from the floor. You see the yellow fabric backpack at center and the brown canvas bag at left. Which bag is covering the other one?" }, { "from": "gpt", "value": "The yellow fabric backpack at center is positioned over the brown canvas bag at left, so the yellow one is covering the brown one." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/002396044aabf224.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is velvet black blazer at left from camera?" }, { "from": "gpt", "value": "A distance of 4.28 meters exists between velvet black blazer at left and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b93e3e01e5dfc388.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of Cahaya Hall and want to take a photo of the two points mentioned. Which point, point (0.513, 0.705) or point (0.721, 0.684), will appear larger in your camera view?" }, { "from": "gpt", "value": "Point (0.513, 0.705) will appear larger in the camera view because it is closer to the camera than point (0.721, 0.684)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b7e710321335c23.jpg", "conversations": [ { "from": "human", "value": "\nBetween purple glossy balloon at upper right and pink glossy balloon at upper right, which one is positioned lower?" }, { "from": "gpt", "value": "pink glossy balloon at upper right is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d8831ff8e9626418.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white paper plate at lower center is positioned above silver metallic fork at plate center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c6e02a55b9973751.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.311, 0.825) lie behind point (0.367, 0.787)?" }, { "from": "gpt", "value": "No, it is in front of (0.367, 0.787)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/90214a4d1e835bb3.jpg", "conversations": [ { "from": "human", "value": "\nPoint to translucent glass tea at center.Point to the translucent glass tea at center in the image." }, { "from": "gpt", "value": "[(0.458, 0.592)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0faebcc442a56db3.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.160, 0.505) come behind point (0.953, 0.627)?" }, { "from": "gpt", "value": "No, (0.160, 0.505) is in front of (0.953, 0.627)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9a0515d726d3bab.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the green matte tree at lower left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.016, 0.900)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d976b898d063a952.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of smooth white shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.648, 0.372)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7f46accda32737a.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.496, 0.570) or (0.342, 0.436)?" }, { "from": "gpt", "value": "Point (0.496, 0.570)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5839f3bc21bfd74.jpg", "conversations": [ { "from": "human", "value": "\nIs stone statue at upper center positioned before matte stone baby at center?" }, { "from": "gpt", "value": "Yes, it is in front of matte stone baby at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d04c45a5a9093451.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the green water at lower center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.492, 0.830)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/72d01258dc1a4f24.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the white matte cow at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.210, 0.491)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/736cb8f278982d39.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of gray stone column at center more distant than that of smooth gray column at center?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4db15ba842baccf8.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.474, 0.653)?" }, { "from": "gpt", "value": "matte red backpack at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d70696d86f2bc539.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if orange fabric shirt at center is positioned to the right of light blue striped shirt at center?" }, { "from": "gpt", "value": "Correct, you'll find orange fabric shirt at center to the right of light blue striped shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/17f003fbdc0ec1ef.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.672, 0.153) and camera?" }, { "from": "gpt", "value": "They are 19.06 inches apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/464b7084ad087e0a.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, matte black magazine at center or floral ceramic mug at upper center?" }, { "from": "gpt", "value": "matte black magazine at center is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1092dfb2598694c4.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, orange jersey at center or blonde hair at center?" }, { "from": "gpt", "value": "From the viewer's perspective, orange jersey at center appears more on the right side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2fe93ea24ce0353b.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, gray matte shirt at center or camouflage uniform at center?" }, { "from": "gpt", "value": "Positioned higher is camouflage uniform at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7c5f31316d81dc20.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.483, 0.695) or point (0.108, 0.875)?" }, { "from": "gpt", "value": "The point (0.483, 0.695) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/90218ca152e11d17.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker trying to find the best spot to take a photo of both the green matte evergreen tree at left and the yellow leafy tree at center. Since you want both in the frame, which side of the road should you stand on?" }, { "from": "gpt", "value": "You should stand on the right side of the road because the green matte evergreen tree at left is to the left of the yellow leafy tree at center, so positioning yourself on the right side will allow you to capture both trees in the same frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d0cf323b0f577f4.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of blue striped shirt at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.589, 0.620)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/948f43dd5add4f17.jpg", "conversations": [ { "from": "human", "value": "\nBetween green leafy tree at upper center and green leafy palm tree at center, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "green leafy tree at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5bfda7f67b7a9be8.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to green mossy cliff at lower left? Please provide its 2D coordinates.Where can I find green mossy cliff at lower left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.309, 0.900)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a7d4ce28db098f4.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the hallway outside the kitchen and looking through the doorway. You see two points marked in the kitchen. Which point is closer to you, point (0.582, 0.555) or point (0.813, 0.803)?" }, { "from": "gpt", "value": "Point (0.582, 0.555) is closer to you because it is further to the viewer than point (0.813, 0.803)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b23093ef45a4fbf5.jpg", "conversations": [ { "from": "human", "value": "\nIs black textured placemat at lower center above pink matte shirt at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/355cf6f5ef6c6184.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between white cotton t-shirt at center and camera?" }, { "from": "gpt", "value": "white cotton t-shirt at center is 2.91 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f08661224896529.jpg", "conversations": [ { "from": "human", "value": "\nBetween brown wooden train track at center and dark blue jeans at right, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "dark blue jeans at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a4561c964d6df3c.jpg", "conversations": [ { "from": "human", "value": "\nBetween black matte keyboard at lower center and natural wood laptop stand at center, which one is positioned higher?" }, { "from": "gpt", "value": "Positioned higher is natural wood laptop stand at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/74a1cfe26dae02d1.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of green leafy hedge at lower left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.117, 0.823)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78409e1fe08edcaa.jpg", "conversations": [ { "from": "human", "value": "\nIs gray wool suit at right thinner than red dotted dress at center?" }, { "from": "gpt", "value": "Yes, gray wool suit at right is thinner than red dotted dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1e7bff37cc55796.jpg", "conversations": [ { "from": "human", "value": "\nPoint to dark brown leather jacket at lower center.Point to the dark brown leather jacket at lower center in the image." }, { "from": "gpt", "value": "[(0.182, 0.662)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e14a189c8108fb6.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.238, 0.959) lie in front of point (0.900, 0.805)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.900, 0.805)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a6e3092674b8275c.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black shirt at left appear on the left side of matte black shirt at center?" }, { "from": "gpt", "value": "In fact, matte black shirt at left is to the right of matte black shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e66860cb4d610d4.jpg", "conversations": [ { "from": "human", "value": "\nHow close is point (0.352, 0.789) from camera?" }, { "from": "gpt", "value": "The distance of point (0.352, 0.789) from camera is 94.18 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2a210c8289a4fb79.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the white stone column at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.579, 0.805)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9a4093e51196b139.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the green leafy tree at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.785, 0.225)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7578d73e134fbc1e.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.347, 0.902) and point (0.083, 0.764), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.083, 0.764) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8229529c03f4af0d.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the matte white helmet at upper left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.055, 0.502)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23ce4ef8730ab3cb.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.371, 0.422) and point (0.409, 0.411), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.371, 0.422) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8db336bab3584435.jpg", "conversations": [ { "from": "human", "value": "\nBased on the scene description, where is the transparent wet concrete at lower center located in terms of coordinates?" }, { "from": "gpt", "value": "The transparent wet concrete at lower center is located at coordinates point (0.319, 0.758)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b875c7282ff17416.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker who wants to cross a rocky area. You see a gray rough boulder at lower left and a dark gray fabric at lower left. Which one is shorter?" }, { "from": "gpt", "value": "The gray rough boulder at lower left is shorter than the dark gray fabric at lower left according to the description." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a818e746b02560f5.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of golden dry wheat field at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.535, 0.477)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/322ee73fa14fe7d8.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.335, 0.688) or (0.649, 0.981)?" }, { "from": "gpt", "value": "Positioned in front is point (0.649, 0.981)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01f998a08f52513d.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.548, 0.355)?" }, { "from": "gpt", "value": "black matte nokia n95 8gb at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/26ecfdec7ad52191.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the green translucent water at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.604, 0.569)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc905016c316209d.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a smooth gray sweater at center. Pinpoint a point to the smooth gray sweater at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.222, 0.812)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2688c5caa52efb4f.jpg", "conversations": [ { "from": "human", "value": "\nDoes smooth concrete pavement at center appear over dark blue jacket at center?" }, { "from": "gpt", "value": "Correct, smooth concrete pavement at center is located above dark blue jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b950679a9645533d.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between gray rock formation at center and dark gray fleece jacket at center." }, { "from": "gpt", "value": "A distance of 157.19 meters exists between gray rock formation at center and dark gray fleece jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e12f2ac798165c8b.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the olive green quilted jacket at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.707, 0.639)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce7b6ca171f337ba.jpg", "conversations": [ { "from": "human", "value": "\nIs blue fabric pants at lower right bigger than dark blue jeans at center?" }, { "from": "gpt", "value": "Correct, blue fabric pants at lower right is larger in size than dark blue jeans at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e2f21e97ec3da2d4.jpg", "conversations": [ { "from": "human", "value": "\nHow close is shiny orange tomato at center from camera?" }, { "from": "gpt", "value": "shiny orange tomato at center and camera are 23.68 inches apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9c254f98d8c0911.jpg", "conversations": [ { "from": "human", "value": "\nDoes black hoodie at left appear on the right side of purple matte backpack at center?" }, { "from": "gpt", "value": "In fact, black hoodie at left is to the left of purple matte backpack at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07baafa0d62395bb.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the scene. You want to take a photo of the matte beige jacket at center. How far should you position yourself from the jacket to capture it clearly?" }, { "from": "gpt", "value": "You should position yourself 13.78 feet away from the matte beige jacket at center to capture it clearly, as that is the distance it is from the camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c87364604294059f.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, dark blue sweater at left or woven rattan stool at center?" }, { "from": "gpt", "value": "Positioned to the right is woven rattan stool at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4745ffec427826f8.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.327, 0.752) and point (0.558, 0.536), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.327, 0.752) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/abd628a16476d948.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.468, 0.947) come in front of point (0.022, 0.625)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.022, 0.625)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8f4e7ae50c0aea4.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, white textured cookies at upper right or green textured cookie at upper right?" }, { "from": "gpt", "value": "white textured cookies at upper right is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1fc7e75a4034c08b.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance measurement between snowy rocky mountain at center and white fluffy snowman at lower left?" }, { "from": "gpt", "value": "They are 225.65 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a30a2ce6c3c5b9ec.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of brown wooden rail at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.381, 0.656)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/820ef4b4d289bb96.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.217, 0.745) lie in front of point (0.504, 0.547)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/98b964246afa5e19.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the white glossy tablet at upper left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.264, 0.500)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d441e11ab74c4a8.jpg", "conversations": [ { "from": "human", "value": "\nBetween white glossy drawer at lower left and gold polished faucet at upper left, which one is positioned higher?" }, { "from": "gpt", "value": "gold polished faucet at upper left is higher up." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff6a1710141bb484.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of red knitted scarf at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.651, 0.688)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e5fe6a1e7d628695.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.348, 0.752)?" }, { "from": "gpt", "value": "pink matte tulip at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78dc26e6377e8126.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the metallic silver record player at left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.149, 0.489)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/505404bfe2f7f231.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the spotted fur cheetah at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.572, 0.847)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0c916af481b51c00.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of green leafy tree at left. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.117, 0.506)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7e27e97901162c6.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of transparent glass door at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.359, 0.211)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ceb3a49bd827f1db.jpg", "conversations": [ { "from": "human", "value": "\nIs speckled feathered bird at center below brown rough rock at lower right?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4cd47879f9fb01e8.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.439, 0.864) come farther from viewer compared to point (0.889, 0.320)?" }, { "from": "gpt", "value": "No, (0.439, 0.864) is in front of (0.889, 0.320)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2eb3744763a39abb.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at a party and need to ensure all guests are visible in the group photo. The two central women are wearing a multicolored printed dress at center and a white lace tank top at center. Which clothing item will appear bigger in the photo?" }, { "from": "gpt", "value": "The multicolored printed dress at center will appear bigger in the photo because it has a larger size compared to the white lace tank top at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e47bad90d811327.jpg", "conversations": [ { "from": "human", "value": "\nHow close is point (0.297, 0.919) from camera?" }, { "from": "gpt", "value": "Point (0.297, 0.919) is 13.65 feet from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a6157497a75510d3.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, matte black mannequin at left or matte pink dress at center?" }, { "from": "gpt", "value": "With less height is matte pink dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/30dc5c0b5b460d03.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a brown fur dog at center. Pinpoint a point to the brown fur dog at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.461, 0.583)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a70de2286df381ae.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if yellow paper sign at center is positioned above black plastic sunglasses at center?" }, { "from": "gpt", "value": "Yes, yellow paper sign at center is above black plastic sunglasses at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d2fdc71e5bdaf2c7.jpg", "conversations": [ { "from": "human", "value": "\nYou are sitting in the front row of the conference room and see two points projected on the screen. The points are labeled as point (0.311, 0.472) and point (0.647, 0.662). Which point is closer to you?" }, { "from": "gpt", "value": "Point (0.311, 0.472) is closer to the viewer than point (0.647, 0.662)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1711faa11d439d0.jpg", "conversations": [ { "from": "human", "value": "\nYou are a pedestrian standing at the crosswalk and see the denim jeans at center and the white plastic license plate at center. Which object is higher from the ground?" }, { "from": "gpt", "value": "The denim jeans at center is above the white plastic license plate at center, so the denim jeans at center is higher from the ground." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5552e3c0e77300f.jpg", "conversations": [ { "from": "human", "value": "\nYou are an artist analyzing a portrait. You notice two elements in the image, the black glittery eye at center and the matte black eye at upper left. Which of these two elements is smaller in size?" }, { "from": "gpt", "value": "The black glittery eye at center is smaller than the matte black eye at upper left according to the description." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/90ceb155bb1f5551.jpg", "conversations": [ { "from": "human", "value": "\nHow close is matte glass bottle at center from wooden table at center?" }, { "from": "gpt", "value": "matte glass bottle at center and wooden table at center are 27.59 centimeters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/66742c95a286505a.jpg", "conversations": [ { "from": "human", "value": "\nDoes pink fabric shirt at upper right have a lesser height compared to black plastic goggles at lower center?" }, { "from": "gpt", "value": "In fact, pink fabric shirt at upper right may be taller than black plastic goggles at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95497d61e56b3cba.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of light brown leather jacket at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.486, 0.717)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d562be88dfd4c1e.jpg", "conversations": [ { "from": "human", "value": "\nYou are a nurse assessing a patient with an injured toe. You notice the yellowish skin at center and the white fabric bandage at center. Which object is larger in size?" }, { "from": "gpt", "value": "The white fabric bandage at center is larger than the yellowish skin at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/19e021bad1378364.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, brown gravel train track at bottom or green leafy tree at center?" }, { "from": "gpt", "value": "green leafy tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/25726542c19e1e21.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between point (0.115, 0.541) and camera?" }, { "from": "gpt", "value": "They are 5.23 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c35a2be22610c41c.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the edge of the river and see the green leafy tree at upper left. If you want to walk directly towards it, how many meters would you have to walk to reach it?" }, { "from": "gpt", "value": "The green leafy tree at upper left is 35.86 meters from viewer, so you would have to walk 35.86 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02f5d1eea370297b.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of shiny black sedan at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.927, 0.625)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5bff3de745046f1e.jpg", "conversations": [ { "from": "human", "value": "\nBetween white leather shoe at upper right and white leather shoe at lower right, which one is positioned lower?" }, { "from": "gpt", "value": "Positioned lower is white leather shoe at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0378edbaa5d9a257.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.491, 0.228) and camera." }, { "from": "gpt", "value": "Point (0.491, 0.228) and camera are 12.43 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c40448004ab971b2.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, gray/dry bush at lower left or green spiny bush at center?" }, { "from": "gpt", "value": "green spiny bush at center is higher up." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cafa33c7a1bbaff8.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of orange/white striped cone at right. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.895, 0.527)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4e44a117e2ea5e0f.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.526, 0.598) or point (0.738, 0.233)?" }, { "from": "gpt", "value": "Positioned in front is point (0.526, 0.598)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/af3edadc663e2fd7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if yellow plastic barrier at left is shorter than white metallic truck at upper center?" }, { "from": "gpt", "value": "Correct, yellow plastic barrier at left is not as tall as white metallic truck at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8f024bf2f18a6e6.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black monitor at left appear on the right side of dark hair at center?" }, { "from": "gpt", "value": "In fact, matte black monitor at left is to the left of dark hair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0903c1c89bfcd2dd.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.385, 0.572) or point (0.639, 0.619)?" }, { "from": "gpt", "value": "Point (0.385, 0.572)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/83a64219ecc6674f.jpg", "conversations": [ { "from": "human", "value": "\nPoint to polished glass globe at center.Point to the polished glass globe at center in the image." }, { "from": "gpt", "value": "[(0.759, 0.791)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03ee9fb63d79296d.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the denim jeans at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.045, 0.698)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/528c1873cca0ed44.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the clear glass window at upper left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.034, 0.234)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/48420b94dda02552.jpg", "conversations": [ { "from": "human", "value": "\nLocate all dark gray suit at lower right in the image." }, { "from": "gpt", "value": "[(0.872, 0.833)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec404600fb119271.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.142, 0.636) closer to viewer compared to point (0.492, 0.577)?" }, { "from": "gpt", "value": "No, (0.142, 0.636) is behind (0.492, 0.577)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d6470e969ace75d.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.515, 0.464) and camera." }, { "from": "gpt", "value": "A distance of 1.26 meters exists between point (0.515, 0.464) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3893f42f39b38de1.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of golden crispy balls at right? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.768, 0.512)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a20667a0bc0be9b.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the promenade and want to take a photo of both point (0.771, 0.861) and point (0.414, 0.844) in the scene. Which point should you focus on first to ensure both are in clear view?" }, { "from": "gpt", "value": "You should focus on point (0.771, 0.861) first because it is closer to you than point (0.414, 0.844), ensuring both points are in clear view." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/91edf55aee0ab5bb.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from point (0.619, 0.536) to camera." }, { "from": "gpt", "value": "Point (0.619, 0.536) and camera are 12.40 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ad1ff53ed3924684.jpg", "conversations": [ { "from": "human", "value": "\nDoes black sand at lower center have a greater height compared to blue floral kimono at center?" }, { "from": "gpt", "value": "In fact, black sand at lower center may be shorter than blue floral kimono at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d41bd20d19ffaee2.jpg", "conversations": [ { "from": "human", "value": "\nIs brass/bronze pillar at left below light green leather armchair at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df5f9d7bf4d4e508.jpg", "conversations": [ { "from": "human", "value": "\nDoes clear water at lower right come behind green fuzzy glove at lower left?" }, { "from": "gpt", "value": "Yes, it is behind green fuzzy glove at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/250a0b8da75cb9f1.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.446, 0.844) or (0.355, 0.714)?" }, { "from": "gpt", "value": "Positioned behind is point (0.355, 0.714)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8f7bad74f8391b6c.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of brown tiled dome at upper center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.722, 0.239)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6bb5910c00d46a18.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.993, 0.478) come behind point (0.547, 0.266)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e179ece9d2f5c308.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the scene and see the dark brown leather jacket at lower left and the dark blue fabric at lower left. Which object is located to the right of the other?" }, { "from": "gpt", "value": "The dark brown leather jacket at lower left is positioned on the right side of dark blue fabric at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/123c25baf3a599ab.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of brown leather overalls at right in the image." }, { "from": "gpt", "value": "[(0.889, 0.586)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/20c8612431e21c33.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the shiny gold robe at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.279, 0.498)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/302e5cc7f02b0864.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if yellow matte bus at center is taller than matte black poster at center?" }, { "from": "gpt", "value": "Yes, yellow matte bus at center is taller than matte black poster at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3abd98ed5b6678ca.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the Microsoft office building and want to know how far you are from the point marked at coordinates point (0.606, 0.498). Can you determine the distance from your current position to that point?" }, { "from": "gpt", "value": "The distance of point (0.606, 0.498) from the camera is 44.81 meters, so you are 44.81 meters away from that point." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db045c0c51a13637.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.336, 0.420)?" }, { "from": "gpt", "value": "checkered fabric shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/afcaa3e6c4dc22fa.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green glass bus stop at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.115, 0.459)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2685ac8507e068ac.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between shiny black tuxedo at center and camera?" }, { "from": "gpt", "value": "shiny black tuxedo at center is 4.57 feet away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/21922685a0e62ff2.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the dull concrete steps at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.355, 0.812)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d7c94ebab74fef4.jpg", "conversations": [ { "from": "human", "value": "\nIs green matte tree at left taller than green matte tree at center?" }, { "from": "gpt", "value": "Yes, green matte tree at left is taller than green matte tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c99007141b541a0.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.490, 0.734) more distant than point (0.883, 0.555)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2856fd1c33098c40.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.202, 0.600) or point (0.530, 0.845)?" }, { "from": "gpt", "value": "Point (0.530, 0.845)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c904f1fb8a0bf024.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, green leafy tree at left or green grassy hillside at upper center?" }, { "from": "gpt", "value": "green leafy tree at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be33077a4eedfd83.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, light blue shirt at center or dark gray pants at center?" }, { "from": "gpt", "value": "light blue shirt at center is higher up." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0572cb65e9382ba2.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of matte black doll at center from white matte shoe at lower left?" }, { "from": "gpt", "value": "They are 46.36 centimeters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/edda38265e38e3ed.jpg", "conversations": [ { "from": "human", "value": "\nDoes green textured tree at upper center have a larger size compared to green coniferous tree at upper center?" }, { "from": "gpt", "value": "Yes, green textured tree at upper center is bigger than green coniferous tree at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/18a965ba802f916f.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the edge of the helipad and want to approach the glossy asphalt tarmac at center to inspect it. What is the distance you need to cover to reach it?" }, { "from": "gpt", "value": "The distance between you and the glossy asphalt tarmac at center is 4.47 meters, so you need to cover 4.47 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/641164ae0ad611d1.jpg", "conversations": [ { "from": "human", "value": "\nIs teal fabric chair at right taller than teal fabric chair at left?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5317ed3df472e7b0.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the shiny green sequins at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.695, 0.772)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9a3e648c1525036.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any dark gray fabric shirt at center in the image." }, { "from": "gpt", "value": "[(0.393, 0.487)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b50c5145a664ab10.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of red plaid vest at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.569, 0.734)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b94b3e725a2a238.jpg", "conversations": [ { "from": "human", "value": "\nDoes wooden bridge at center have a greater width compared to rustic stone hut at upper center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d50d524ae94364c4.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.588, 0.445) or (0.900, 0.412)?" }, { "from": "gpt", "value": "Point (0.588, 0.445) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d3aa869eb321967.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.396, 0.455) or (0.328, 0.138)?" }, { "from": "gpt", "value": "Positioned in front is point (0.396, 0.455)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/65c5bc9e6d5d2104.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, white shirt at center or green fabric table at lower left, stands taller?" }, { "from": "gpt", "value": "white shirt at center is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/309a05c7b93fcb2d.jpg", "conversations": [ { "from": "human", "value": "\nPoint to brown wood tree branch at center.Point to the brown wood tree branch at center in the image." }, { "from": "gpt", "value": "[(0.784, 0.678)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/52766e65da7908e8.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black storefront at center is bigger than yellow painted curb at lower center?" }, { "from": "gpt", "value": "Indeed, matte black storefront at center has a larger size compared to yellow painted curb at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff406baf7184eb1d.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.789, 0.375) farther from viewer compared to point (0.353, 0.616)?" }, { "from": "gpt", "value": "Yes, point (0.789, 0.375) is farther from viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/059b80de3b976cb9.jpg", "conversations": [ { "from": "human", "value": "\nYou are an animal researcher observing the squirrel in the image. You need to determine which part of the squirrel is wider when viewed from above. Which is wider, the brown fur squirrel at center or the brown fuzzy tail at center?" }, { "from": "gpt", "value": "The brown fur squirrel at center is wider than the brown fuzzy tail at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc7732ee6a0d0f99.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.225, 0.806)?" }, { "from": "gpt", "value": "wooden polished boat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46a19d03204c5e50.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the matte yellow balloon at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.595, 0.512)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/586573b9bca807bb.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of brown smooth hair at upper center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.639, 0.225)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8cefb355c7201b5f.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of yellow metallic bus at right? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.951, 0.555)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0126565c0fa71927.jpg", "conversations": [ { "from": "human", "value": "\nIs pink fabric shorts at lower left smaller than light brown sand at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/619d4237899c7a93.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, brown rough log at center or spotted fur leopard at center?" }, { "from": "gpt", "value": "Positioned higher is spotted fur leopard at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e3dbded526577047.jpg", "conversations": [ { "from": "human", "value": "\nIs dark blue fabric bag at lower left further to the viewer compared to black matte vest at center?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/522a33d6279550f1.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.573, 0.522) lie in front of point (0.320, 0.448)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd3dfa524f23c746.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.443, 0.805) or (0.538, 0.427)?" }, { "from": "gpt", "value": "The point (0.538, 0.427) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b75a5dddce27b0c.jpg", "conversations": [ { "from": "human", "value": "\nYou are a pedestrian walking along the wet brick street and notice the RAFA stall with its blue canopy. You see a white glossy van at center and light brown hair at lower left. Which object is positioned more to the east? Please answer based on the scene orientation where the stall faces north." }, { "from": "gpt", "value": "The white glossy van at center is to the right of light brown hair at lower left. Since the stall faces north, right would correspond to the east direction. Therefore, the white glossy van at center is positioned more to the east." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9a3d63f505d8acc.jpg", "conversations": [ { "from": "human", "value": "\nYou are a bird looking for a nesting spot. You want to choose the taller tree between the green leafy tree at left and the green leafy tree at right. Which one should you choose?" }, { "from": "gpt", "value": "The green leafy tree at right is taller than the green leafy tree at left, so you should choose the green leafy tree at right for nesting." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e5f62c87d9ecb639.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked by the coordinates point (0.726, 0.169) in front of the grand Gothic cathedral. Which architectural feature of the cathedral does this point indicate?" }, { "from": "gpt", "value": "The point (0.726, 0.169) marks the stone gothic tower at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/43558e60aa637e7b.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.700, 0.113) come behind point (0.377, 0.103)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23d6a2a9f7b633c7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if glossy black car at center is smaller than matte silver convertible at center?" }, { "from": "gpt", "value": "No, glossy black car at center is not smaller than matte silver convertible at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1089c3d572d14fc0.jpg", "conversations": [ { "from": "human", "value": "\nLocate all wooden roller coaster at center in the image." }, { "from": "gpt", "value": "[(0.600, 0.461)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/47f679ceee171d18.jpg", "conversations": [ { "from": "human", "value": "\nYou are an art conservator examining the display case containing the preserved body of Saint Faustina. You notice a point marked at coordinates (0.181, 0.894). Based on the scene description, what object is located at this point?" }, { "from": "gpt", "value": "The point at coordinates (0.181, 0.894) indicates the location of the gold ornate frame at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d93847a14253f013.jpg", "conversations": [ { "from": "human", "value": "\nIs leather jacket at lower right to the left of plaid fabric shirt at center from the viewer's perspective?" }, { "from": "gpt", "value": "Incorrect, leather jacket at lower right is not on the left side of plaid fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70a56f144e8fc8d0.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the white matte car at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.422, 0.736)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4d6cfcb7846eb52.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.176, 0.725) positioned after point (0.808, 0.542)?" }, { "from": "gpt", "value": "No, (0.176, 0.725) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/43084348a489a7d2.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of blue water at upper center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.503, 0.192)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7eab9db512019a75.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue matte train at center is positioned to the left of metallic blue bicycle at center?" }, { "from": "gpt", "value": "Indeed, blue matte train at center is positioned on the left side of metallic blue bicycle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/673ed2d8945a68cf.jpg", "conversations": [ { "from": "human", "value": "\nYou are at an outdoor event and see two people at the center wearing a navy fleece jacket at center and a red plaid shirt at center. Which one is on the left side?" }, { "from": "gpt", "value": "The navy fleece jacket at center is on the left side of the red plaid shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4281407137dacc0.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the gray fabric jacket at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.313, 0.750)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b803eac2ac7b231.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.190, 0.250)?" }, { "from": "gpt", "value": "green textured pine tree at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ddbd4a993e001bc0.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.545, 0.648)?" }, { "from": "gpt", "value": "shiny blue peacock at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ea5fd459601ef67.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a candid shot of the two people in the scene. You notice the matte blue shirt at left and the black fabric strap at right. Which object should you focus on if you want to capture the taller one?" }, { "from": "gpt", "value": "The matte blue shirt at left is taller than the black fabric strap at right, so you should focus on the matte blue shirt at left to capture the taller one." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c5dbf06494224b86.jpg", "conversations": [ { "from": "human", "value": "\nWhere is tan leather trench coat at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.767, 0.411)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2fdf5b2c33e15e27.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, black textured hair at upper right or brown matte hair at center?" }, { "from": "gpt", "value": "black textured hair at upper right is higher up." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/42d9c639f61a5cad.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the matte black dress at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.600, 0.672)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bad50aa259ef6a47.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.719, 0.645) and point (0.263, 0.463), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.263, 0.463) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/879d2e9ff8055ef3.jpg", "conversations": [ { "from": "human", "value": "\nIs red shirt at right bigger than yellow fabric at center?" }, { "from": "gpt", "value": "No, red shirt at right is not bigger than yellow fabric at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/91d19a5919254eca.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.134, 0.495) less distant than point (0.203, 0.872)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4108dcbae30dd949.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of dark brown leather jacket at lower right? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.838, 0.961)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58e8dbb939634568.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the beach and want to take a photo of the green smooth water at center. Where should you position yourself to capture the water in the center of your camera frame?" }, { "from": "gpt", "value": "Position yourself directly in front of the green smooth water at center, as its 2D coordinates are at point (0.619, 0.539), which is the center of the image. Align your camera to focus on that point to capture the water in the center of your frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/316eed02c4ef8ce3.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any concrete pavement at center in the image." }, { "from": "gpt", "value": "[(0.444, 0.877)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d94a0ef6c035a116.jpg", "conversations": [ { "from": "human", "value": "\nYou are packing for a trip and have two items in your view. You need to choose the larger one to carry more clothes. Which one should you pick between the gray fabric duffel at lower right and the matte black backpack at upper center?" }, { "from": "gpt", "value": "The gray fabric duffel at lower right is larger in size than the matte black backpack at upper center, so you should choose the gray fabric duffel at lower right to carry more clothes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea3daccfcb4864be.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a clear shot of the white cotton shirt at center during the protest. However, the multicolored fabric crowd at center is blocking your view. Based on the scene description, can you determine if the crowd is between you and the shirt, or behind the shirt?" }, { "from": "gpt", "value": "The multicolored fabric crowd at center is above the white cotton shirt at center, so the crowd is positioned higher up and might not block the view directly. Adjust your angle to look downward or move to a higher vantage point to capture the shirt without obstruction." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c6eee726d7092fd9.jpg", "conversations": [ { "from": "human", "value": "\nLocate metallic orange boat at upper center in the image." }, { "from": "gpt", "value": "[(0.285, 0.656)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e72c82427ce3c60.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown rough stone at lower center is positioned below green stone castle at center?" }, { "from": "gpt", "value": "Indeed, brown rough stone at lower center is positioned under green stone castle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/753c41507351515b.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.381, 0.680) and point (0.311, 0.770), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.311, 0.770)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb5cfef97283b1a0.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the light brown wooden bicycle at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.654, 0.709)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/14f826af2eab4e98.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.362, 0.463) and point (0.152, 0.467), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.152, 0.467) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49f8ea622291fdc1.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.513, 0.450) or point (0.699, 0.573)?" }, { "from": "gpt", "value": "The point (0.513, 0.450) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/452d4175c50cd8d2.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white fluffy insulation at left is smaller than white matte suit at center?" }, { "from": "gpt", "value": "Incorrect, white fluffy insulation at left is not smaller in size than white matte suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/68d0c9ed12122f86.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of rustic wood bench at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.496, 0.802)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/200444f6badf6d72.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.696, 0.703) positioned in front of point (0.066, 0.023)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e6bc3ee4500d261c.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green leafy tree at upper left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.032, 0.237)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9027aec56705c04a.jpg", "conversations": [ { "from": "human", "value": "\nPoint to yellow satin saree at center.Point to the yellow satin saree at center in the image." }, { "from": "gpt", "value": "[(0.423, 0.673)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4b8d5f6d3829566c.jpg", "conversations": [ { "from": "human", "value": "\nIs granite mountain at left smaller than greenish-blue water at center?" }, { "from": "gpt", "value": "Incorrect, granite mountain at left is not smaller in size than greenish-blue water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f04a30e8f6d187e.jpg", "conversations": [ { "from": "human", "value": "\nDoes black fabric at left have a greater height compared to black fabric man at lower left?" }, { "from": "gpt", "value": "In fact, black fabric at left may be shorter than black fabric man at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0399d1997c0d2b3d.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the green matte plant at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.222, 0.603)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c126c12e7c868533.jpg", "conversations": [ { "from": "human", "value": "\nHow far is blue shirt at center from camera?" }, { "from": "gpt", "value": "blue shirt at center is 60.56 feet from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2df1d52d0af108d9.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of green fabric tank top at center in the image." }, { "from": "gpt", "value": "[(0.547, 0.769)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46c630884b4bf1c3.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of velvety dark green leaf at lower left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.276, 0.588)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc78fbafec04ee72.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte white shirt at center is smaller than green fabric skirt at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7d836950fd0e3b5e.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.322, 0.244) come in front of point (0.965, 0.702)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b2b3818fe3110a23.jpg", "conversations": [ { "from": "human", "value": "\nYou are an architect designing a new plaza and want to place a 36 inch wide statue between the white marble monument at center and the white marble statue at left. Is there enough space?" }, { "from": "gpt", "value": "The distance between the white marble monument at center and the white marble statue at left is 35.10 inches. Since the statue you want to place is 36 inches wide, it would not fit as the space is slightly narrower than required." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/954b0b9ba4fcdec2.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark brown matte wok at right have a lesser height compared to green smooth/woody green beans at left?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3cab58b121feecaa.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the smooth concrete pavement at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.595, 0.880)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7c7f04121beeb01.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, matte black glasses at center or transparent plastic glasses at center, stands taller?" }, { "from": "gpt", "value": "Standing taller between the two is matte black glasses at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aca0f31b05aa9bd2.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the green glass tower at left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.195, 0.486)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2befdbf25b47c9f9.jpg", "conversations": [ { "from": "human", "value": "\nLocate the velvet-like gray coat at center in the image." }, { "from": "gpt", "value": "[(0.325, 0.573)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b3984f2a78777e8.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a brown and white spotted cow at right. Pinpoint a point to the brown and white spotted cow at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.789, 0.625)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85b9d5f3376bf074.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer who wants to capture a clear shot of the man in the dark suit standing at point (0.502, 0.389). The camera you are using has a focal length of 50mm and an aperture of f2.8. Given that the point and the camera are 10.39 feet apart, what is the minimum distance you need to move closer to ensure the man is in focus if the depth of field at f2.8 allows for sharpness within 8 feet of the camera?" }, { "from": "gpt", "value": "The point (0.502, 0.389) is 10.39 feet away from the camera. Since the depth of field at f2.8 allows sharpness within 8 feet, the photographer needs to move closer so that the distance between the camera and the point is within 8 feet. Therefore, the minimum distance to move closer is 10.39 feet minus 8 feet, which equals 2.39 feet closer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/946626481b797cd0.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is yellow caution tape at center from orange reflective cone at left?" }, { "from": "gpt", "value": "A distance of 7.19 feet exists between yellow caution tape at center and orange reflective cone at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bbc23928dc91d599.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.603, 0.444) from camera?" }, { "from": "gpt", "value": "Point (0.603, 0.444) and camera are 2.83 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3f8ee9fed2d1654f.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at point (0.477, 0.411) and want to walk to the shore. The shore is 30.12 feet away from your current position. Can you estimate how many steps it would take to reach the shore if each of your steps is about 2.5 feet long?" }, { "from": "gpt", "value": "The distance to the shore is 30.12 feet, and each step is 2.5 feet. Dividing 30.12 by 2.5 gives approximately 12.05 steps. Therefore, you would need about 12 steps to reach the shore." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be32892c79f0c09f.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy cabbage at lower right appear on the left side of white cotton shirt at upper right?" }, { "from": "gpt", "value": "Yes, green leafy cabbage at lower right is to the left of white cotton shirt at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd34743419c0e95c.jpg", "conversations": [ { "from": "human", "value": "\nLocate the smooth bark tree at left in the image." }, { "from": "gpt", "value": "[(0.171, 0.136)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e88b6ca5ea328785.jpg", "conversations": [ { "from": "human", "value": "\nIs gray hoodie at left to the left of neon yellow hair at center from the viewer's perspective?" }, { "from": "gpt", "value": "Correct, you'll find gray hoodie at left to the left of neon yellow hair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/833329ab971de3f6.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the concrete bridge at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.472, 0.723)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/409423af42ef8ab1.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the camouflage uniform at center and the white fabric sandbags at lower right in a single shot. Based on their positions, which object should you focus on first to ensure both are in frame?" }, { "from": "gpt", "value": "The camouflage uniform at center is located above the white fabric sandbags at lower right, so you should focus on the camouflage uniform at center first to ensure both are in frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c9cade0b02865db0.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.304, 0.664) and point (0.543, 0.588), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.543, 0.588)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2bc56629bc39f4dc.jpg", "conversations": [ { "from": "human", "value": "\nCould you provide the distance between white cotton shirt at center and brown charred meat at center?" }, { "from": "gpt", "value": "white cotton shirt at center and brown charred meat at center are 10.11 feet apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4dd67436c1dd1138.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person trying to enter the building. You see two doors at the entrance, a green glass door at center and a green matte door at center. Which door should you use to enter the building?" }, { "from": "gpt", "value": "The green matte door at center is larger than the green glass door at center, so you should use the green matte door at center to enter the building since it is more likely to be the main entrance." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/909559bb97bb3dea.jpg", "conversations": [ { "from": "human", "value": "\nLocate brown textured building at center in the image." }, { "from": "gpt", "value": "[(0.148, 0.400)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b69ea5452824962.jpg", "conversations": [ { "from": "human", "value": "\nDoes clear blue water at center come in front of green leafy tree at center?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/65b538330f92727a.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow cardboard tubes at center thinner than yellow cardboard cup at center?" }, { "from": "gpt", "value": "In fact, yellow cardboard tubes at center might be wider than yellow cardboard cup at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a0e0084f7705bb42.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing a photo shoot and need to arrange two white satin items in the scene. The items are the white satin dress at center and the white satin shirt at upper right. Based on their sizes, which item should be placed closer to the camera to ensure both appear proportionally balanced in the final image?" }, { "from": "gpt", "value": "The white satin dress at center is smaller in size compared to the white satin shirt at upper right. To achieve proportional balance, the smaller white satin dress at center should be placed closer to the camera while the larger white satin shirt at upper right can be positioned slightly farther back. This way, their sizes in the photograph will appear more balanced." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb2d7e4b3be2368c.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the white cloth table at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.660, 0.639)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/637063c758690fe9.jpg", "conversations": [ { "from": "human", "value": "\nDoes white fondant cake at center appear on the left side of white fleece vest at center?" }, { "from": "gpt", "value": "Correct, you'll find white fondant cake at center to the left of white fleece vest at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c7cafc9bff40fff.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the black suit at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.244, 0.678)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23e951eeee9bce80.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.863, 0.602) come closer to viewer compared to point (0.620, 0.994)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/96caf6093022c340.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if light blue fabric at upper right is taller than matte black portrait at left?" }, { "from": "gpt", "value": "Correct, light blue fabric at upper right is much taller as matte black portrait at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/beb508f0e778acbc.jpg", "conversations": [ { "from": "human", "value": "\nCould you provide the distance between green grass at lower center and polished gray statue at center?" }, { "from": "gpt", "value": "green grass at lower center is 3.26 meters from polished gray statue at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b630773e575c64e4.jpg", "conversations": [ { "from": "human", "value": "\nHow distant is white fleece jacket at center from black plastic sunglasses at upper center?" }, { "from": "gpt", "value": "The distance of white fleece jacket at center from black plastic sunglasses at upper center is 3.80 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e6bca9cbdf53bd5.jpg", "conversations": [ { "from": "human", "value": "\nDoes red fleece hoodie at center have a larger size compared to multicolored plastic goggles at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f519b8d239ce1d35.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, leather jacket at center or purple glossy bicycle at left?" }, { "from": "gpt", "value": "Positioned to the left is purple glossy bicycle at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a6c888129384f4d9.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing items on a desk and need to place a new object between the white plastic building at center and the clear glass window at upper center. Considering their widths, which object should be placed closer to the edge of the desk to ensure there is enough space?" }, { "from": "gpt", "value": "The white plastic building at center has a lesser width compared to the clear glass window at upper center, so the white plastic building at center should be placed closer to the edge of the desk to leave more space for the wider clear glass window at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8ba857e7c8201770.jpg", "conversations": [ { "from": "human", "value": "\nDoes yellow lined paper at upper center have a lesser height compared to pastel-colored handwriting at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ac2941e0398bce3.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked as point (0.271, 0.839) and want to take a photo of the two boys sitting on the tree branch. How far do you need to move towards the camera to be in the correct position?" }, { "from": "gpt", "value": "You need to move 1.32 meters towards the camera to be in the correct position because the point (0.271, 0.839) and the camera are 1.32 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/033358a3f7f9b9fc.jpg", "conversations": [ { "from": "human", "value": "\nYou are a medical professional examining the smooth skin foot at center and the smooth orange toe at center. Which of these two has a greater height?" }, { "from": "gpt", "value": "The smooth skin foot at center is taller than the smooth orange toe at center according to the description." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d25fcce9fa88a56.jpg", "conversations": [ { "from": "human", "value": "\nHow close is point (0.259, 0.692) from camera?" }, { "from": "gpt", "value": "They are 3.56 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/57cbf65fc3fd8a9a.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the left, wooden microwave at upper right or clear glass jar at right?" }, { "from": "gpt", "value": "clear glass jar at right is more to the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eeb187a7163618fe.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.810, 0.602) or point (0.095, 0.484)?" }, { "from": "gpt", "value": "Point (0.810, 0.602) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9bd2b72b89d6ca58.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a striped sweater at center. Pinpoint a point to the striped sweater at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.264, 0.683)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dade0124195d2fd6.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of turquoise glossy water at center in the image." }, { "from": "gpt", "value": "[(0.261, 0.728)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/39cd628e37647ad4.jpg", "conversations": [ { "from": "human", "value": "\nPoint to matte black vest at center.Point to the matte black vest at center in the image." }, { "from": "gpt", "value": "[(0.622, 0.373)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c87db3b1fca5e10.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, brown fur otter at center or shaggy brown otter at upper right, stands shorter?" }, { "from": "gpt", "value": "With less height is shaggy brown otter at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/629b7f8fd69a1b45.jpg", "conversations": [ { "from": "human", "value": "\nYou are a wildlife photographer observing two herons in a wetland. You notice the white smooth heron at center and the white feathered bird at center. Which heron should you focus on if you want to capture the larger bird in your shot?" }, { "from": "gpt", "value": "The white feathered bird at center is larger than the white smooth heron at center, so you should focus on the white feathered bird at center to capture the larger bird in your shot." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2223c74948926cad.jpg", "conversations": [ { "from": "human", "value": "\nYou are a stagehand preparing to set up equipment for the next act. You need to place a new microphone stand to the left of the existing black plastic microphone at upper center. Where should you position it relative to the metallic silver microphone at right?" }, { "from": "gpt", "value": "The metallic silver microphone at right is positioned on the right side of the black plastic microphone at upper center. Therefore, placing the new microphone stand to the left of the black plastic microphone at upper center would mean positioning it to the left of the metallic silver microphone at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3cf38a879733479e.jpg", "conversations": [ { "from": "human", "value": "\nDoes glistening water at center appear under wooden bench at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/55b29bae494f85a7.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.431, 0.420) or (0.072, 0.066)?" }, { "from": "gpt", "value": "Positioned in front is point (0.431, 0.420)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2bf4da6562e279c8.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the perfect shot of the two people playing catch. You notice the white matte ball at center and the light green cotton shirt at left. Which object should you focus on if you want to capture the larger subject in your frame?" }, { "from": "gpt", "value": "The white matte ball at center is larger in size than the light green cotton shirt at left, so focusing on the white matte ball at center will capture the larger subject." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec9f830e478c7c9b.jpg", "conversations": [ { "from": "human", "value": "\nDoes green grass at center have a greater height compared to blue cotton shirt at center-right?" }, { "from": "gpt", "value": "Correct, green grass at center is much taller as blue cotton shirt at center-right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3eda367f4d2a3022.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from point (0.814, 0.844) to camera." }, { "from": "gpt", "value": "A distance of 33.17 inches exists between point (0.814, 0.844) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/13fc0778708f6e0d.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.463, 0.242) in front of point (0.194, 0.247)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d3338a27bae0c73.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.620, 0.711) positioned after point (0.998, 0.608)?" }, { "from": "gpt", "value": "No, it is in front of (0.998, 0.608)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60b5db3eda56487b.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a brown suede jacket at center. Pinpoint a point to the brown suede jacket at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.720, 0.519)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7bda69e7d3284592.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, matte black vest at center or translucent glass beverage at lower left?" }, { "from": "gpt", "value": "Positioned higher is matte black vest at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b76d8bf1383ee944.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any brown wooden bench at center-right in the image." }, { "from": "gpt", "value": "[(0.717, 0.556)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/678fb68127166577.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of green leafy mountain at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.485, 0.145)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d69f97a2465537a.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, matte green vase at left or speckled glass vase at center?" }, { "from": "gpt", "value": "speckled glass vase at center is below." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f265c35975f29f53.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if smooth gray bench at center is positioned to the left of smooth gray stone bench at lower left?" }, { "from": "gpt", "value": "No, smooth gray bench at center is not to the left of smooth gray stone bench at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/954262cdcafd6d32.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of bronze statue at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.494, 0.717)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c9fa3d2375708083.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.036, 0.841) and camera?" }, { "from": "gpt", "value": "Point (0.036, 0.841) and camera are 1.11 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e067427ec6cca80d.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at upper center shorter than green leafy tree at upper right?" }, { "from": "gpt", "value": "No, green leafy tree at upper center is not shorter than green leafy tree at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/992a259827cd406a.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, white matte building at center or black wire at upper center?" }, { "from": "gpt", "value": "white matte building at center is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7cfc11801e2dc0f6.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.930, 0.605) farther from viewer compared to point (0.112, 0.230)?" }, { "from": "gpt", "value": "No, (0.930, 0.605) is in front of (0.112, 0.230)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b78554d9bceb1e18.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of black striped shirt at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.790, 0.694)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f0315c201ce479a.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the hallway and see the green matte hat at upper left and the black felt hat at upper center. Which hat is positioned higher up in the image?" }, { "from": "gpt", "value": "The green matte hat at upper left is positioned higher up than the black felt hat at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/40060af0ae16ccce.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person with a cart that is 10 feet wide. You need to navigate between the white fabric umbrella at center and the white fabric umbrella at left. Can your cart fit through the space between them?" }, { "from": "gpt", "value": "The distance between the white fabric umbrella at center and white fabric umbrella at left is 30.55 feet. Since your cart is only 10 feet wide, it can easily fit through the space between them as the distance is more than sufficient." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/381e901d8dcabf24.jpg", "conversations": [ { "from": "human", "value": "\nYou are driving a car and see the image on your dashboard camera. There is a point at coordinates (0.574, 0.441) in the image. How far is that point from your car?" }, { "from": "gpt", "value": "The point at coordinates (0.574, 0.441) is 38.29 feet away from the camera, so it is 38.29 feet away from your car." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f29022617b391244.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.757, 0.539) or (0.977, 0.445)?" }, { "from": "gpt", "value": "Point (0.977, 0.445)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5864bd962a794c2d.jpg", "conversations": [ { "from": "human", "value": "\nHow close is shiny brown fur at left from camera?" }, { "from": "gpt", "value": "shiny brown fur at left is 5.35 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/24dd05b7b55feddd.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the room and want to take a photo of the transparent glass window at upper center using a camera. The camera requires a minimum distance of 10 feet to focus properly. Is the distance between you and the window sufficient for the camera to focus?" }, { "from": "gpt", "value": "The transparent glass window at upper center and camera are 15.55 feet apart from each other. Since the minimum required distance is 10 feet, the distance is sufficient for the camera to focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/33fb6299ef2a6b60.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a blue fabric flag at center. Pinpoint a point to the blue fabric flag at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.366, 0.377)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05a77954a480e67b.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the blue fleece jacket at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.355, 0.497)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/20ea87fb671ddfd2.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of matte blue umbrella at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.374, 0.597)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6508bf6d71d46160.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between golden brown flaky pastry at lower center and camera?" }, { "from": "gpt", "value": "golden brown flaky pastry at lower center is 1.46 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bce27abf26b8a0dc.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the circular concrete platform in front of the rustic building. You see a green leafy tree at upper right and a green leafy plant at lower center. Which of these two plants is taller?" }, { "from": "gpt", "value": "The green leafy plant at lower center is taller than the green leafy tree at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc3265da1893c204.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of matte black hat at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.486, 0.566)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8de422db3fc42798.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a teal wooden boat at center. Pinpoint a point to the teal wooden boat at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.508, 0.680)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/15f3946b55140509.jpg", "conversations": [ { "from": "human", "value": "\nWhere is yellow matte ambulance at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.598, 0.487)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cec5a087a5c4b51a.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked by the coordinates point (0.312, 0.631) in a military cemetery. You want to place a wreath at the base of the central evergreen tree. How far do you need to walk to reach the tree?" }, { "from": "gpt", "value": "You need to walk 12.69 meters to reach the central evergreen tree from point (0.312, 0.631)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f6b270d0e22ccd69.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a candid shot of both the dark blue sweater at center and the dark blue jacket at center. Since you want to ensure both subjects are fully in frame, you need to know which one is wider. Which clothing item has a greater width?" }, { "from": "gpt", "value": "The dark blue sweater at center has a greater width than the dark blue jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/783585f2a524b389.jpg", "conversations": [ { "from": "human", "value": "\nIs black and white striped jersey at center wider than gold polished trophy at upper center?" }, { "from": "gpt", "value": "Yes, black and white striped jersey at center is wider than gold polished trophy at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8fd480ee9891d2fe.jpg", "conversations": [ { "from": "human", "value": "\nWhere is black matte box at upper center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.669, 0.294)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bcfdca2a247a550c.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the edge of the event area. You want to take a photo of the white plastic chairs at center and the white shirt at center so that both are clearly visible. However, you notice that one object is much taller than the other. Which object will appear larger in the photo?" }, { "from": "gpt", "value": "The white plastic chairs at center will appear larger in the photo because they are much taller than the white shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/282ec8c27b390a84.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from matte black pants at lower left to camera." }, { "from": "gpt", "value": "The distance of matte black pants at lower left from camera is 7.33 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03c441230e65c2c4.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue denim jeans at left have a greater width compared to gray heathered t-shirt at center?" }, { "from": "gpt", "value": "No, blue denim jeans at left is not wider than gray heathered t-shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c8ab77a064b09189.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of dark brown leather jacket at lower left. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.100, 0.795)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4091f407dcdbbcbc.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the edge of the water and want to walk to the green leafy tree at upper center. Which direction should you head relative to the green grass at lower left?" }, { "from": "gpt", "value": "The green leafy tree at upper center is positioned on the left side of green grass at lower left, so you should head to the left relative to the green grass at lower left to reach the tree." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be46177ed8693c0b.jpg", "conversations": [ { "from": "human", "value": "\nBetween brown stone bridge at upper center and matte white pants at upper center, which one has less height?" }, { "from": "gpt", "value": "matte white pants at upper center is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/51e52761e0bbe29d.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of pink fabric dress at lower center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.615, 0.708)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4c298c89f1d388fa.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the white matte shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.567, 0.539)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4c1b4e8719526eed.jpg", "conversations": [ { "from": "human", "value": "\nYou are moving the white plastic desktop computer at center to a smaller desk. Based on the scene, will the wooden table at center have enough space to accommodate the computer after moving it?" }, { "from": "gpt", "value": "The wooden table at center is bigger than the white plastic desktop computer at center, so yes, the wooden table at center has enough space to accommodate the computer after moving it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce8da2aed14ce085.jpg", "conversations": [ { "from": "human", "value": "\nIs green grassy vineyard at center to the right of green plastic fence at center from the viewer's perspective?" }, { "from": "gpt", "value": "Incorrect, green grassy vineyard at center is not on the right side of green plastic fence at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/42b56605badfb390.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.801, 0.898) or point (0.068, 0.884)?" }, { "from": "gpt", "value": "Positioned behind is point (0.068, 0.884)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6462cdfc70a36cea.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.160, 0.747) closer to viewer compared to point (0.759, 0.267)?" }, { "from": "gpt", "value": "Yes, point (0.160, 0.747) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6a9654f685d02148.jpg", "conversations": [ { "from": "human", "value": "\nWhat does the point at coordinates (0.907, 0.641) represent in the image?" }, { "from": "gpt", "value": "The point at coordinates (0.907, 0.641) indicates the green leafy hedge at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4d5d1927837dd1c9.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte tank top at center wider than white fabric shirt at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de1577a0e09ca347.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.232, 0.906)?" }, { "from": "gpt", "value": "silver metallic laptop at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7d2f4b3215be40e8.jpg", "conversations": [ { "from": "human", "value": "\nLocate all white dotted jacket at right in the image." }, { "from": "gpt", "value": "[(0.824, 0.361)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d65d2e6bb0b6d904.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of matte blue shirt at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.510, 0.525)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/35b50283a566001e.jpg", "conversations": [ { "from": "human", "value": "\nBased on the scene description, what object is located at the coordinates point (0.307, 0.686)?" }, { "from": "gpt", "value": "The brown matte skin at center is located at point (0.307, 0.686)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eab182ddf78e5737.jpg", "conversations": [ { "from": "human", "value": "\nCould you provide the distance between gray stone church at center and green leafy tree at right?" }, { "from": "gpt", "value": "A distance of 9.54 meters exists between gray stone church at center and green leafy tree at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e4c878c47c470b08.jpg", "conversations": [ { "from": "human", "value": "\nHow much distance is there between matte white shirt at center and green leafy hedge at lower center?" }, { "from": "gpt", "value": "They are 46.07 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c1d0216b82a42af.jpg", "conversations": [ { "from": "human", "value": "\nLocate beige cotton shirt at center in the image." }, { "from": "gpt", "value": "[(0.852, 0.561)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd046d3db6512dd5.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing in front of the brick building. You want to take a photo that includes both the point at position (0.306, 0.572) and the point at position (0.490, 0.906). Which point should you focus on to ensure both are in sharp focus?" }, { "from": "gpt", "value": "You should focus on the point at position (0.306, 0.572) because it is closer to the camera than the point at position 0.909, 0.490. By focusing on the closer point, the depth of field will likely include both points in sharp focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/32ac0b66a7d08de3.jpg", "conversations": [ { "from": "human", "value": "\nYou are moving into a new apartment and need to know where to place your new microwave. The microwave is 18 inches tall. You see the white matte dryer at left and the white matte dishwasher at left in the kitchen. Can you determine if there is enough vertical space between them to place the microwave?" }, { "from": "gpt", "value": "The white matte dryer at left is located above the white matte dishwasher at left, so there is space between them. However, the exact vertical distance isn not provided, so we cannot confirm if it is sufficient for the 18 inch microwave." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0896f517f570815.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between black lace bikini at center and camera?" }, { "from": "gpt", "value": "black lace bikini at center is 2.72 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49bf1a2c52cc9dd4.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.142, 0.072) positioned after point (0.169, 0.667)?" }, { "from": "gpt", "value": "No, (0.142, 0.072) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/56b4fb5043c4b323.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.589, 0.680) or point (0.244, 0.689)?" }, { "from": "gpt", "value": "Point (0.589, 0.680)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce51786d43d4f489.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any black fabric shed at center in the image." }, { "from": "gpt", "value": "[(0.302, 0.439)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44534615e4f85e9f.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green uniform at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.986, 0.634)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/297dabb3afb7f364.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the metallic at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.487, 0.803)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0629a79f9143ae15.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person standing on the black asphalt at center. You need to place a package on the matte red blouse at center. Is the distance between them within your arm reach?" }, { "from": "gpt", "value": "The distance between the black asphalt at center and the matte red blouse at center is 7.04 feet, which is approximately 84.48 inches. Since an average human arm length is about 25 to 30 inches, the distance is too far to reach with your arm." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a336ba5576f49d87.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between pearl necklace at center and camera." }, { "from": "gpt", "value": "pearl necklace at center and camera are 5.27 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a03bb3350eafb50e.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, purple woven sari at center or green leafy banana tree at right?" }, { "from": "gpt", "value": "green leafy banana tree at right is more to the right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0136956186c97a03.jpg", "conversations": [ { "from": "human", "value": "\nHow far is dark blue pool at center from camera?" }, { "from": "gpt", "value": "They are 25.03 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/56fd8baa9e9879b5.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.170, 0.841) or (0.406, 0.286)?" }, { "from": "gpt", "value": "Point (0.170, 0.841) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b2383387ef8d007.jpg", "conversations": [ { "from": "human", "value": "\nDoes black cotton vest at center have a lesser height compared to black matte hand at center?" }, { "from": "gpt", "value": "Incorrect, black cotton vest at center's height does not fall short of black matte hand at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b39fd8bad15debca.jpg", "conversations": [ { "from": "human", "value": "\nYou are planning to place a picnic blanket between the green leafy tree at center and the matte black leather jacket at center. What is the minimum length of the picnic blanket needed to stretch between them?" }, { "from": "gpt", "value": "The green leafy tree at center and matte black leather jacket at center are 9.28 meters apart from each other, so the minimum length of the picnic blanket needed to stretch between them is 9.28 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c63302514bed58e.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.035, 0.756) from camera?" }, { "from": "gpt", "value": "Point (0.035, 0.756) is 81.55 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bbfe9430d15f8292.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.498, 0.973) positioned before point (0.292, 0.102)?" }, { "from": "gpt", "value": "Yes, point (0.498, 0.973) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e1294e60c5db8146.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.751, 0.961) or point (0.447, 0.642)?" }, { "from": "gpt", "value": "Positioned behind is point (0.447, 0.642)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f4f4ee09ec40f094.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of green fabric shirt at center in the image." }, { "from": "gpt", "value": "[(0.394, 0.294)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d8896efc277a04b1.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte van at center to the left of denim jacket at center from the viewer's perspective?" }, { "from": "gpt", "value": "Yes, white matte van at center is to the left of denim jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e142ba65a6f276ba.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of brown textured stone clock tower at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.471, 0.744)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/68c8428417361d67.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the bustling urban street scene in front of the large dome roof building. There are two points marked on the ground in front of you. The first point is at coordinate point(0.808, 0.787) and the second is at point(0.260, 0.509). If you want to walk towards the point that is closer to you, which coordinate should you head towards?" }, { "from": "gpt", "value": "You should head towards point(0.260, 0.509) because it is closer to you than point(0.808, 0.787), which is further away." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd1a7fed46d7e077.jpg", "conversations": [ { "from": "human", "value": "\nLocate the white matte flag at center in the image." }, { "from": "gpt", "value": "[(0.736, 0.580)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88005bde607d9718.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.826, 0.750) and point (0.529, 0.570), which one is positioned behind?" }, { "from": "gpt", "value": "Point (0.529, 0.570)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/98af5f2bf30f7b88.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, green matte christmas tree at upper left or pink tulle dress at lower center?" }, { "from": "gpt", "value": "green matte christmas tree at upper left is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/af1dc215fba89a99.jpg", "conversations": [ { "from": "human", "value": "\nLocate all shiny metallic bicycle at center in the image." }, { "from": "gpt", "value": "[(0.555, 0.617)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/79521941d2b83458.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.319, 0.466) or (0.429, 0.350)?" }, { "from": "gpt", "value": "Point (0.319, 0.466)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/359ef87956d07910.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the concrete stairs at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.578, 0.534)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0788cbb0e7774500.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the green grassy hillside at lower left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.138, 0.709)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c6ebfa3176c3ac23.jpg", "conversations": [ { "from": "human", "value": "\nIs blue water at lower left behind green grass at lower right?" }, { "from": "gpt", "value": "No, blue water at lower left is in front of green grass at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/abe26b0cdada391c.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the matte yellow hoodie at center and the dirt track at center in a single frame. Given that your camera can only focus on objects larger than 10 cm, will both objects be in focus?" }, { "from": "gpt", "value": "The dirt track at center is bigger than matte yellow hoodie at center, so the dirt track at center will be in focus. However, the matte yellow hoodie at center might be too small to be focused clearly if it is under 10 cm in size." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16d2525085c651c4.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.711, 0.256) less distant than point (0.292, 0.216)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.292, 0.216)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/abca515a04e9b596.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.172, 0.508)?" }, { "from": "gpt", "value": "white matte/soft robe at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f02b323d2058755f.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.563, 0.530) from camera?" }, { "from": "gpt", "value": "Point (0.563, 0.530) is 26.20 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5380d5e285f23397.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.267, 0.819) or point (0.628, 0.292)?" }, { "from": "gpt", "value": "Point (0.267, 0.819) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9028c1a74db2b386.jpg", "conversations": [ { "from": "human", "value": "\nWhere is purple rubber tubes at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.637, 0.700)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7139b0509575f858.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position in the conference room scene. There is a point marked at coordinates point (0.422, 0.344). How far is that point from where you are standing?" }, { "from": "gpt", "value": "The point (0.422, 0.344) is 6.38 feet away from the camera position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23a53c3192ce89ac.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer planning to capture a landscape shot of the coastal town. You want to ensure both the green leafy tree at lower left and the green leafy tree at upper center are visible in your frame. Considering their heights, which tree might require you to adjust your camera angle more to include its full height?" }, { "from": "gpt", "value": "The green leafy tree at lower left has a greater height compared to the green leafy tree at upper center, so you would need to adjust your camera angle more to include its full height." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5dcc6b3e9fa5b15e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if light beige suit at center is thinner than matte black hand at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/afddabeb2261af5a.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing a clothing display and need to arrange the white fabric shorts at lower left and the striped polo shirt at center according to their positions in the image. Which item should be placed to the right side of the display?" }, { "from": "gpt", "value": "The white fabric shorts at lower left should be placed to the right side of the display because, according to the description, the white fabric shorts at lower left is to the right of striped polo shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ebb31139e231f45.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of matte black jacket at center?" }, { "from": "gpt", "value": "A distance of 3.90 feet exists between matte black jacket at center and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6073363802c2e1db.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.074, 0.909) and point (0.708, 0.953), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.074, 0.909) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5fc5700cd9c5b3a7.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, floral fabric shirt at center or black textured shirt at center?" }, { "from": "gpt", "value": "Positioned to the left is black textured shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab077d7f6b3b364c.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of matte brown t-shirt at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.304, 0.695)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58ed7a5c29888c91.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing a photo shoot and need to place a backdrop behind the two people in the image. The backdrop is 1.8 meters wide. The patterned knit dress at center and the black shirt at left are positioned in front of the backdrop. Which person requires a wider backdrop to fully capture their clothing details without cropping?" }, { "from": "gpt", "value": "The patterned knit dress at center requires a wider backdrop since its width surpasses that of the black shirt at left, ensuring no details are cropped." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed2ca6611085ef77.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is shiny red sedan at left from shiny black sedan at left?" }, { "from": "gpt", "value": "shiny red sedan at left is 36.20 inches away from shiny black sedan at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5697278fd8e8caa.jpg", "conversations": [ { "from": "human", "value": "\nDoes smooth concrete pool at center appear on the right side of silvery reflective moon at upper left?" }, { "from": "gpt", "value": "Indeed, smooth concrete pool at center is positioned on the right side of silvery reflective moon at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a21982a815b4908.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.138, 0.798) closer to camera compared to point (0.493, 0.727)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.493, 0.727)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c050d1ed91ab1cb1.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture both the orange printed shirt at center and the gray fleece sweatshirt at center in a single frame. Since you want to ensure both are clearly visible, which clothing item should you focus on first to ensure proper exposure, considering their sizes?" }, { "from": "gpt", "value": "The orange printed shirt at center is larger than the gray fleece sweatshirt at center, so you should focus on the orange printed shirt at center first to ensure proper exposure, as its larger size will require more attention to capture details accurately." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/da0ea8b3b1685d4f.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.506, 0.509) and point (0.483, 0.452), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.506, 0.509) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f6db1b8e6f61fde9.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the dark blue water at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.059, 0.678)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23797b7b076155df.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the edge of a park and see the black wood table at center and the white plastic helicopter at center. Which object is closer to you?" }, { "from": "gpt", "value": "The black wood table at center is closer to you because it is in front of the white plastic helicopter at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/066773c4d81d32d6.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between orange matte carrot at center and smooth brown onion at lower right?" }, { "from": "gpt", "value": "They are 2.43 inches apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a776bfe9dd41b829.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.066, 0.561)?" }, { "from": "gpt", "value": "gray cotton shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60156d7066a8b068.jpg", "conversations": [ { "from": "human", "value": "\nIs asphalt track at center below matte black car at center?" }, { "from": "gpt", "value": "No, asphalt track at center is not below matte black car at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/83436908218ef948.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the event and want to capture a photo where both the shiny metallic costume at left and the matte black shirt at upper right are visible. Based on their positions, which object is closer to the camera?" }, { "from": "gpt", "value": "The shiny metallic costume at left is closer to the camera because it is in front of the matte black shirt at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e85de91d2f9d412.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any green leafy tree at upper right in the image." }, { "from": "gpt", "value": "[(0.864, 0.152)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b3d6c39c3d7f2dd6.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the shiny chrome car at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.564, 0.884)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bdb443f11321bd86.jpg", "conversations": [ { "from": "human", "value": "\nDescribe the object at (0.826, 0.423)." }, { "from": "gpt", "value": "multicolored painted buildings at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f34a52cd4e04b39c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.366, 0.631)?" }, { "from": "gpt", "value": "clear water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/014a6593575a4330.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the object located at the coordinates point (0.139, 0.506)?" }, { "from": "gpt", "value": "The object at point (0.139, 0.506) is a clear plastic speaker at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c95e7465cfb2220.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of blonde hair at upper right from khaki cotton baseball cap at center?" }, { "from": "gpt", "value": "blonde hair at upper right is 8.82 meters away from khaki cotton baseball cap at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e103995a8192872c.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the striped sweater at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.339, 0.605)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f05019ed18d4663e.jpg", "conversations": [ { "from": "human", "value": "\nYou are attending this meeting and need to locate the black matte suit at left and the green silk tie at right. Based on their positions, which one is closer to the center of the table?" }, { "from": "gpt", "value": "The black matte suit at left is positioned under the green silk tie at right, meaning it is closer to the center of the table than the green silk tie at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3f76dd2a6265b321.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is green leafy tree at center from matte pink jacket at center?" }, { "from": "gpt", "value": "green leafy tree at center and matte pink jacket at center are 18.32 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba0804a0b5763a37.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of matte red tie at left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.251, 0.655)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d710eb207922d435.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.800, 0.573) come behind point (0.424, 0.242)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d88f87774347670f.jpg", "conversations": [ { "from": "human", "value": "\nYou are a customer at a bakery and want to order the teal frosting cupcake at center and the white matte icing at right. The cashier asks you to describe their positions relative to each other so they can locate them easily. How would you describe their positions?" }, { "from": "gpt", "value": "The teal frosting cupcake at center is located below the white matte icing at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b0b353dba88016b.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing a photo shoot and need to ensure that the orange matte shirt at center and the matte black backpack at center are both visible in the frame. Considering their sizes, which object should you focus on to ensure both are captured without cropping?" }, { "from": "gpt", "value": "The orange matte shirt at center occupies less space than the matte black backpack at center, so focusing on the matte black backpack at center would ensure both objects are visible since it is larger and requires more space in the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e7f59641148077c.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green glossy water at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.510, 0.798)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c69487ce203dacf4.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, black matte body at center or dark gray skin at left?" }, { "from": "gpt", "value": "With less height is dark gray skin at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9852e3e4e386f805.jpg", "conversations": [ { "from": "human", "value": "\nIs high visibility yellow safety vest at center further to the viewer compared to matte pink goggles at center?" }, { "from": "gpt", "value": "No, it is in front of matte pink goggles at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73343b7fbd259af5.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.625, 0.430) positioned after point (0.258, 0.678)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a4e4a0708542d0b.jpg", "conversations": [ { "from": "human", "value": "\nYou are a food stylist arranging a holiday plate. You have a translucent plastic hand at lower right and a transparent plastic hand at upper left. Which hand takes up more space on the plate?" }, { "from": "gpt", "value": "The transparent plastic hand at upper left takes up more space on the plate than the translucent plastic hand at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/562b2012b6144c37.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of point (0.576, 0.463)?" }, { "from": "gpt", "value": "Point (0.576, 0.463) and camera are 541.41 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/760b69f8d2046f93.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.489, 0.673)?" }, { "from": "gpt", "value": "black matte hand at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/27531e039c1e38fa.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is white glossy tube of toothpaste at center from camera?" }, { "from": "gpt", "value": "white glossy tube of toothpaste at center and camera are 63.71 centimeters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b2a6633cd7c5d024.jpg", "conversations": [ { "from": "human", "value": "\nIs dirt path at center further to the viewer compared to pink matte jacket at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cfe6e7fc825069b6.jpg", "conversations": [ { "from": "human", "value": "\nDoes wooden gazebo at center have a lesser height compared to black backpack at lower right?" }, { "from": "gpt", "value": "Incorrect, wooden gazebo at center's height does not fall short of black backpack at lower right's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/689a52f81c81cfdc.jpg", "conversations": [ { "from": "human", "value": "\nYou need to sit down in the scene and want to choose between the metallic gray chair at upper left and the white plastic chair at center. Which chair has a wider seat to sit on?" }, { "from": "gpt", "value": "The metallic gray chair at upper left is wider than the white plastic chair at center, so it has a wider seat to sit on." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f362bb1a398a9d36.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of brown rough bark tree trunk at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.458, 0.417)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a55d5e8ccdb12f37.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the green grassy at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.512, 0.812)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e57460b3543f2bd1.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.240, 0.681) closer to camera compared to point (0.243, 0.872)?" }, { "from": "gpt", "value": "No, (0.240, 0.681) is further to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a0a01073443c00dc.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the white matte stripe at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.887, 0.455)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d7cfb98d5f48b174.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of purple tulle dress at left. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.113, 0.397)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cbc870e47a39c622.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between dry grass at lower center and camera?" }, { "from": "gpt", "value": "They are 29.23 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e412e58ad53b3a14.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.727, 0.255)?" }, { "from": "gpt", "value": "glassy skyscraper at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/10c70d59e9837038.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is red brick mansion at center from camera?" }, { "from": "gpt", "value": "red brick mansion at center and camera are 53.39 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a78fd648df08854a.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.535, 0.791) and camera?" }, { "from": "gpt", "value": "A distance of 1.38 meters exists between point (0.535, 0.791) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a29f8c3683ef2204.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.985, 0.184) from camera?" }, { "from": "gpt", "value": "6.51 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0f0f26fb6d6d53b.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.412, 0.342) come farther from viewer compared to point (0.247, 0.386)?" }, { "from": "gpt", "value": "No, (0.412, 0.342) is in front of (0.247, 0.386)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a0a20a5a7466a21e.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the black stone statue at center. If you want to take a photo of it from a distance where you can capture the entire statue and the sunset backdrop, would 6.29 meters be a suitable distance?" }, { "from": "gpt", "value": "The distance of the black stone statue at center from viewer is 6.29 meters. This distance should allow you to capture the entire statue and the sunset backdrop in your photo." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/328073820a6942ff.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the white matte clipboard at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.286, 0.438)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/146c05096967a0d7.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.561, 0.903) or (0.355, 0.297)?" }, { "from": "gpt", "value": "Point (0.561, 0.903) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/724b8a0574de0e6b.jpg", "conversations": [ { "from": "human", "value": "\nYou are planning to take a boat ride and need to choose between the wooden boat at center and the wooden longboat at left. Which one can accommodate more passengers based on their sizes?" }, { "from": "gpt", "value": "The wooden boat at center has a larger size compared to wooden longboat at left, so it can accommodate more passengers." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/902b7881dc35681a.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of matte red jacket at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.597, 0.770)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea41a093a4b475d4.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any green matte tree at center in the image." }, { "from": "gpt", "value": "[(0.508, 0.795)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d189cf7f2ebfedaa.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte airplane at center appear under camouflage-patterned rifle at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e8985af798c1830.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow matte shoe at center taller than yellow fabric hand at center?" }, { "from": "gpt", "value": "No, yellow matte shoe at center is not taller than yellow fabric hand at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4cba941b1208364.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if yellow fleece jacket at center is positioned below smooth black microphone at center?" }, { "from": "gpt", "value": "Indeed, yellow fleece jacket at center is positioned under smooth black microphone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d0cabe0f28b781f.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.686, 0.972) or (0.912, 0.995)?" }, { "from": "gpt", "value": "Point (0.912, 0.995)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d229f8750902d81b.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.441, 0.530)?" }, { "from": "gpt", "value": "pink blossoms at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f9c883c66ef3aab6.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at a viewpoint overlooking the canal scene. You want to take a photo of the point at coordinates point (0.511, 0.625) in the image. If your camera has a maximum focus range of 300 feet, will it be able to focus on that point?" }, { "from": "gpt", "value": "The distance of point (0.511, 0.625) from the camera is 298.60 feet, which is within the camera maximum focus range of 300 feet. Therefore, the camera can focus on that point." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5169b41f1afcf483.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of orange cotton shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.687, 0.812)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73287def7c222080.jpg", "conversations": [ { "from": "human", "value": "\nIs matte red blouse at center to the right of red fabric flag at upper left from the viewer's perspective?" }, { "from": "gpt", "value": "Indeed, matte red blouse at center is positioned on the right side of red fabric flag at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08b66e6ba8510b17.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.547, 0.859)?" }, { "from": "gpt", "value": "clear plastic headlight at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a85e6d521ee1062.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and want to reach the point marked at coordinates (0.485, 0.522). How far do you need to walk to get there?" }, { "from": "gpt", "value": "The point marked at coordinates (0.485, 0.522) is 13.46 meters away from your current position at the camera, so you need to walk 13.46 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5413b68faeee837a.jpg", "conversations": [ { "from": "human", "value": "\nWhere is the gray stone statue at left located in the image?" }, { "from": "gpt", "value": "The gray stone statue at left is located at point (0.285, 0.623) in the image." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/904c62dd3fef960d.jpg", "conversations": [ { "from": "human", "value": "\nIs green needle-like tree at left to the right of green matte evergreen tree at lower left from the viewer's perspective?" }, { "from": "gpt", "value": "Correct, you'll find green needle-like tree at left to the right of green matte evergreen tree at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/207667577a42fbd1.jpg", "conversations": [ { "from": "human", "value": "\nYou are a tourist standing on the left side of the brown stone palace at center. You want to take a photo of the French flag on top of the building while also capturing the greenish water at center in the reflection. Which direction should you face to include both the flag and the water in your shot?" }, { "from": "gpt", "value": "You should face to the right of the brown stone palace at center. Since the greenish water at center is to the right of the palace, facing that direction will allow you to capture both the French flag on top of the palace and its reflection in the greenish water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef3b6ab5715cc76e.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of green leafy tree at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.662, 0.533)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc4f6fe4d8026603.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.576, 0.873) or (0.686, 0.794)?" }, { "from": "gpt", "value": "Point (0.576, 0.873) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9a5ddde38005ad98.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any smooth red bridge at center in the image." }, { "from": "gpt", "value": "[(0.553, 0.570)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb7bb6e1e1ae054b.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.323, 0.234) more distant than point (0.522, 0.794)?" }, { "from": "gpt", "value": "Yes, point (0.323, 0.234) is farther from viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/632ef4bea57f89fa.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green grass at upper center is positioned to the left of charred seared steak at center?" }, { "from": "gpt", "value": "Correct, you'll find green grass at upper center to the left of charred seared steak at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e3d2bcacc2e8080.jpg", "conversations": [ { "from": "human", "value": "\nDoes green plastic boat at center have a greater width compared to silhouette human at center?" }, { "from": "gpt", "value": "Yes, green plastic boat at center is wider than silhouette human at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/93f179153b5e8dd2.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, matte black shutters at left or matte black shutters at upper left?" }, { "from": "gpt", "value": "matte black shutters at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ee353bff420c7d98.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the white cotton bib at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.733, 0.458)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/277cfcc5e721c33e.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between white smooth sand at center and green spiky plant at center?" }, { "from": "gpt", "value": "white smooth sand at center and green spiky plant at center are 3.54 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f54a9096b6201394.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, golden stone clock tower at center-right or golden stone spire at center?" }, { "from": "gpt", "value": "golden stone clock tower at center-right is more to the right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b01bf7781bd1ea40.jpg", "conversations": [ { "from": "human", "value": "\nIs matte gray statue at center shorter than green fabric flag at upper center?" }, { "from": "gpt", "value": "Incorrect, matte gray statue at center's height does not fall short of green fabric flag at upper center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/93135bf02116f6d7.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked as point (0.015, 0.080) in the image. How far are you from the camera?" }, { "from": "gpt", "value": "You are 4.12 meters away from the camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/97960d318a4df179.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of orange scarf at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.596, 0.798)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16e77e7bd0a29b82.jpg", "conversations": [ { "from": "human", "value": "\nDoes smooth brown bark at right have a greater height compared to brown speckled eagle at center?" }, { "from": "gpt", "value": "Correct, smooth brown bark at right is much taller as brown speckled eagle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4ff586270d5a3f41.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of satin burgundy dress at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.599, 0.767)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c41739327c9e85f.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between white fabric table at center and camera." }, { "from": "gpt", "value": "white fabric table at center is 15.36 feet away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/67ab36e9d72e1301.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any clear glass window at center in the image." }, { "from": "gpt", "value": "[(0.686, 0.353)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5f736b34c8b9d5a8.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if mahogany wood door at center is shorter than polished metal balustrade at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b432c5de6c6996d6.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between wooden table at center and camera." }, { "from": "gpt", "value": "A distance of 26.11 inches exists between wooden table at center and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d6d32291cf5d8c3.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if striped cotton shirt at left is smaller than purple cotton shirt at center?" }, { "from": "gpt", "value": "Correct, striped cotton shirt at left occupies less space than purple cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e5cf8968c9775df7.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker who wants to measure the size of the tree trunks in the forest. If the brown rough bark at left is 1.2 meters wide, how wide is the brown rough bark at center?" }, { "from": "gpt", "value": "The brown rough bark at center is smaller than the brown rough bark at left, which is 1.2 meters wide. Therefore, the brown rough bark at center is less than 1.2 meters wide." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7804fb0fa1999a25.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the eagle and want to touch both points on the image. Which point should you reach for first, point (0.840, 0.052) or point (0.398, 0.245), to touch the one closer to you?" }, { "from": "gpt", "value": "Point (0.840, 0.052) is closer to you than point (0.398, 0.245), so you should reach for point (0.840, 0.052) first." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5117896f0ed5d134.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of a historic building with a crowd nearby. You notice someone with dark gray hair at upper right. How far are you from that person?" }, { "from": "gpt", "value": "You are 14.81 meters away from the dark gray hair at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d39eba7bb189645.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.485, 0.948) or (0.952, 0.762)?" }, { "from": "gpt", "value": "The point (0.952, 0.762) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b0d05a48963d9c5.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown crumbly food at lower left have a smaller size compared to matte white bowl at center?" }, { "from": "gpt", "value": "No, brown crumbly food at lower left is not smaller than matte white bowl at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8ba126514f865b32.jpg", "conversations": [ { "from": "human", "value": "\nYou are in a kayak and want to reach a point marked at coordinates (0.358, 0.781). The kayak is 4 meters long. Can you reach that point without getting out of the kayak?" }, { "from": "gpt", "value": "The point at coordinates (0.358, 0.781) is 11.45 meters away from the camera. Since the kayak is 4 meters long, you can reach it without getting out as the distance is greater than the kayak length." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/31509d77c398be31.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person who needs to place a small package between the gold polished brass lamp at left and the gold metallic pillow at left. The package is 45 centimeters long. Will it fit between them?" }, { "from": "gpt", "value": "The gold polished brass lamp at left and gold metallic pillow at left are 46.42 centimeters apart from each other. The package is 45 centimeters long, so it will fit between them with 1.42 centimeters of space remaining." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1956eae38447170d.jpg", "conversations": [ { "from": "human", "value": "\nYou are a construction worker standing at point (0.355, 0.656) in the room. You need to reach the ladder leaning against the wall near the red door with glass panels. Is the ladder closer to you than the red door with glass panels?" }, { "from": "gpt", "value": "The ladder is closer to you than the red door with glass panels because the ladder is next to the point where you are standing." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff9025e0515644f5.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the pathway and want to take a photo of the fluffy pink blossoms at center and the light blue striped shirt at center. Which object should you zoom in more on to capture both in the frame?" }, { "from": "gpt", "value": "You should zoom in more on the light blue striped shirt at center because the fluffy pink blossoms at center are wider, so zooming in on the smaller object allows both to fit in the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5dd6620fd54beed3.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any white matte truck at center in the image." }, { "from": "gpt", "value": "[(0.497, 0.650)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d4f7feadfa088f82.jpg", "conversations": [ { "from": "human", "value": "\nYou are planning to build a small garden between the clear water at lower right and the brown gravel road at center. Which area has more space to accommodate plants?" }, { "from": "gpt", "value": "The clear water at lower right is larger in size than the brown gravel road at center, so the area near the clear water at lower right has more space for plants." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/282387bba02019f2.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of white fabric chair at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.589, 0.736)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8266462e03781731.jpg", "conversations": [ { "from": "human", "value": "\nWhat is located at the coordinates point (0.341, 0.739) in the image?" }, { "from": "gpt", "value": "The point (0.341, 0.739) corresponds to the multicolored fabric at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/404a54d41f20cdf0.jpg", "conversations": [ { "from": "human", "value": "\nWhat is at (0.540, 0.648)?" }, { "from": "gpt", "value": "black fluffy cat at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/787c601b98d8d107.jpg", "conversations": [ { "from": "human", "value": "\nPoint to weathered wood dock at center.Point to the weathered wood dock at center in the image." }, { "from": "gpt", "value": "[(0.629, 0.791)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9cf33a6974fe82e.jpg", "conversations": [ { "from": "human", "value": "\nWhere is leather jacket at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.335, 0.705)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5b11b13ec4db145.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte red lollipop at center have a larger size compared to glossy red lollipop at center?" }, { "from": "gpt", "value": "Yes, matte red lollipop at center is bigger than glossy red lollipop at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/94f971761905bbc5.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.104, 0.877) positioned in front of point (0.169, 0.559)?" }, { "from": "gpt", "value": "No, (0.104, 0.877) is further to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e3b7bd0015bf4f86.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.402, 0.358) and point (0.559, 0.516), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.402, 0.358) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d4880a279b3a0c8.jpg", "conversations": [ { "from": "human", "value": "\nDoes black smooth water at center appear on the left side of smooth skin crowd at upper left?" }, { "from": "gpt", "value": "No, black smooth water at center is not to the left of smooth skin crowd at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de886cbbb03e675e.jpg", "conversations": [ { "from": "human", "value": "\nYou are a visitor trying to board a boat. You see the wooden boat at center and the wooden at center. Which one is wider?" }, { "from": "gpt", "value": "The wooden boat at center is wider than the wooden at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9319256795ba453.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between green matte tree at center and green mossy mountain range at upper center?" }, { "from": "gpt", "value": "A distance of 158.47 meters exists between green matte tree at center and green mossy mountain range at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/afca9392e473f2c1.jpg", "conversations": [ { "from": "human", "value": "\nDoes white frothy water at center have a greater width compared to dark rock cliff at upper center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/220d8423b8101be3.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the event and want to capture a photo of both the red fabric jacket at center and the matte red jacket at center. Which jacket should you focus on first if you want to include both in your frame without adjusting your camera angle?" }, { "from": "gpt", "value": "You should focus on the matte red jacket at center first because it is taller than the red fabric jacket at center, ensuring it fits within the frame when capturing both." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a23a737d9a1f9195.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, black checkered flag at upper left or red matte shirt at center?" }, { "from": "gpt", "value": "red matte shirt at center is more to the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7b08b2f425f46a8.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the red plastic stool at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.600, 0.867)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fcd332deca17526c.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, green matte tree at center or brown textured tree at left?" }, { "from": "gpt", "value": "green matte tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a6dcc06c733376cf.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.887, 0.806) and camera?" }, { "from": "gpt", "value": "Point (0.887, 0.806) is 6.85 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d8d39ae7303823a.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.969, 0.889) lie behind point (0.960, 0.153)?" }, { "from": "gpt", "value": "No, (0.969, 0.889) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c244f1ceb7c064d.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of white matte truck at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.732, 0.362)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f20f97e129f81268.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray fabric climbing harness at center have a greater height compared to brown leather jacket at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/272956235b312f0f.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the center of the front area of the building. You need to locate the black flagpole at right. In which direction should you look to find it?" }, { "from": "gpt", "value": "The black flagpole at right is located at point (0.924, 0.553) in 2D coordinates. Since you are at the center of the front area, you should look towards the right side to find it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc39455ec4393e08.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.594, 0.477) lie behind point (0.398, 0.861)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4fbc364edc2f1d35.jpg", "conversations": [ { "from": "human", "value": "\nYou are a parking attendant who needs to fit a compact car into the remaining space between the black matte police car at center and the white glossy sedan at right. Based on their sizes, which vehicle should you position closer to the compact car to ensure it fits?" }, { "from": "gpt", "value": "The black matte police car at center is smaller than the white glossy sedan at right, so positioning the compact car closer to the black matte police car at center would provide enough space for it to fit." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c9e2c534f4a77c48.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the blue t-shirt at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.780, 0.800)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/004eade658984f5a.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of point (0.533, 0.670)?" }, { "from": "gpt", "value": "8.80 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b4334f2bd25ce37.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of white glossy cruise ship at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.615, 0.552)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2213f3ea8af08b46.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, silvery reflective water at center or green leafy trees at center?" }, { "from": "gpt", "value": "Standing shorter between the two is green leafy trees at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d2b921c08ced41b5.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.270, 0.930) closer to viewer compared to point (0.827, 0.713)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.827, 0.713)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/efcb085f8a38e9bc.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of silver metallic microphone at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.731, 0.259)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be7150cdd22dcf34.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to adjust the lighting for a group photo. You notice the black matte shirt at center and the black matte jacket at left. Which one is covering part of the other?" }, { "from": "gpt", "value": "The black matte shirt at center is positioned over the black matte jacket at left, meaning the shirt is covering part of the jacket." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e931fda760b1e28.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black suit at center is wider than white glossy table at upper right?" }, { "from": "gpt", "value": "Yes, matte black suit at center is wider than white glossy table at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/45d1c2a91b75640c.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the green grass at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.655, 0.855)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d6b0350f57a35b3.jpg", "conversations": [ { "from": "human", "value": "\nYou are observing the sky scene and want to determine which of the two points, point (0.712, 0.903) or point (0.113, 0.800), is closer to you. Based on the description, which point is nearer?" }, { "from": "gpt", "value": "Point (0.712, 0.903) is closer to the viewer than point (0.113, 0.800)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c926d4c9eafb8397.jpg", "conversations": [ { "from": "human", "value": "\nIs brown leather jacket at center shorter than red-white-striped flag at left?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1aec616f68155acd.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of purple soft fabric baby at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.475, 0.261)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/14d8ee8fd378eea2.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.349, 0.872) come behind point (0.275, 0.230)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2786d9042de31544.jpg", "conversations": [ { "from": "human", "value": "\nLocate shiny black suit at left in the image." }, { "from": "gpt", "value": "[(0.178, 0.484)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b8331568986563c.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in a room with large glass windows. You see a dark matte jacket at center. If you want to move closer to the jacket, which direction should you move relative to your current position?" }, { "from": "gpt", "value": "Since the dark matte jacket at center is located at point (0.621, 0.713) in the image, you should move towards the center of the room to get closer to it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4ecc82b0dc37e216.jpg", "conversations": [ { "from": "human", "value": "\nIs red fabric flag at center positioned in front of red and white striped flag at left?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb25dd4b3ea9f90c.jpg", "conversations": [ { "from": "human", "value": "\nBased on the scene description, which object takes up more area in the image, the green leafy tree at upper center or the clear water at center?" }, { "from": "gpt", "value": "The clear water at center takes up more area than the green leafy tree at upper center because the green leafy tree at upper center occupies less space than clear water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7842434a26c4b82.jpg", "conversations": [ { "from": "human", "value": "\nYou are a surveyor measuring distances between structures in a coastal area. You observe the concrete at center and the gray concrete water at center. What is the distance between them?" }, { "from": "gpt", "value": "The distance between the concrete at center and the gray concrete water at center is 53.78 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/97e3d73598637f4d.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of the trade show booth and want to take a photo of the point at coordinates (0.440, 0.356). How far should you position yourself from the camera to capture this point in your shot?" }, { "from": "gpt", "value": "The point at coordinates (0.440, 0.356) is 3.32 meters away from the camera, so you should position yourself approximately 3.32 meters away from the camera to capture this point in your shot." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ced1414334e4cf9.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, blue glossy water at center or white fabric canopy at center?" }, { "from": "gpt", "value": "From the viewer's perspective, blue glossy water at center appears more on the right side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02dde20a6bc9fbbb.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at point (0.460, 0.778) in the image. How far are you from the camera?" }, { "from": "gpt", "value": "The point (0.460, 0.778) is 29.09 meters away from the camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/26513366c3ef6a08.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of granite stairs at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.457, 0.805)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f54d9d4030a633ed.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.612, 0.736) farther from viewer compared to point (0.553, 0.603)?" }, { "from": "gpt", "value": "Yes, it is behind point (0.553, 0.603)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6988888d1333345b.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of green stone monkey at center in the image." }, { "from": "gpt", "value": "[(0.329, 0.742)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/66530b54fc693b93.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.919, 0.514)?" }, { "from": "gpt", "value": "gray rough wood at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/20604021100f3c15.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.718, 0.403)?" }, { "from": "gpt", "value": "beige fabric jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/80e7afd1e13d99bd.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of metallic silver car at left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.022, 0.427)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a3db5c4fac529740.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.283, 0.627) come farther from viewer compared to point (0.965, 0.486)?" }, { "from": "gpt", "value": "No, (0.283, 0.627) is in front of (0.965, 0.486)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/74001e1e16fc7cac.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte shirt at center have a lesser height compared to black plastic sunglasses at center?" }, { "from": "gpt", "value": "No, white matte shirt at center is not shorter than black plastic sunglasses at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/616a80093c70d5f5.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.750, 0.812) and point (0.444, 0.792), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.750, 0.812) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d7f0d1b2eeba311.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the origin point in the forest scene. There is a point located at coordinates (0.429, 0.128). Which object in the scene does this point belong to?" }, { "from": "gpt", "value": "The point at coordinates (0.429, 0.128) is on the camo fabric hammock at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1596ed7fc7aa7cc3.jpg", "conversations": [ { "from": "human", "value": "\nPoint to shiny black sedan at left.Point to the shiny black sedan at left in the image." }, { "from": "gpt", "value": "[(0.084, 0.552)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e5781c99ee579839.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a photo of the two people in the center of the tent. The pink knitted sweater at center and the white matte shirt at center are both in frame. Since you want to ensure both are fully visible, which clothing item should you focus on adjusting the camera angle to accommodate its height?" }, { "from": "gpt", "value": "The pink knitted sweater at center is shorter than the white matte shirt at center, so you should adjust the camera angle to accommodate the shorter height of the pink knitted sweater at center to ensure both are fully visible." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/45493e141f332789.jpg", "conversations": [ { "from": "human", "value": "\nLocate gold/black plaque at center in the image." }, { "from": "gpt", "value": "[(0.470, 0.458)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba9c73d84b7c32b8.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of pink matte tank top at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.511, 0.537)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d7e46e599c393aa.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.504, 0.892) and point (0.237, 0.938), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.237, 0.938) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0632f4a32b6ea317.jpg", "conversations": [ { "from": "human", "value": "\nLocate rusty wood pillar at center in the image." }, { "from": "gpt", "value": "[(0.543, 0.539)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8636b33833c5d801.jpg", "conversations": [ { "from": "human", "value": "\nWhere is white plastic window at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.642, 0.695)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/55c81dc90dd07156.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of dry grass at upper left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.290, 0.125)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ad1a6cf2bd6d1f2.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.678, 0.136) in front of point (0.913, 0.877)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/531fb99f63b8b943.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if pink shirt at left is positioned below white plastic chair at center?" }, { "from": "gpt", "value": "No, pink shirt at left is not below white plastic chair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c212883974485fc.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a white stone church at upper center. Pinpoint a point to the white stone church at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.566, 0.655)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/644afa979b137598.jpg", "conversations": [ { "from": "human", "value": "\nDoes green matte plastic hand at center come behind smooth yellow shirt at upper center?" }, { "from": "gpt", "value": "No, green matte plastic hand at center is in front of smooth yellow shirt at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/57f87395038c2775.jpg", "conversations": [ { "from": "human", "value": "\nLocate all yellow matte backpack at center in the image." }, { "from": "gpt", "value": "[(0.605, 0.438)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0100d5897a742b22.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between green fuzzy jacket at center and camera." }, { "from": "gpt", "value": "green fuzzy jacket at center is 64.38 feet away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9237e719f80e1774.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the camera position. You need to adjust your focus to capture the white cotton tank top at center clearly. What is the approximate distance you should set your camera focus to?" }, { "from": "gpt", "value": "The white cotton tank top at center is 15.99 feet away from the camera, so you should set the camera focus to approximately 16 feet to capture it clearly." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/159324be8603d192.jpg", "conversations": [ { "from": "human", "value": "\nIs clear plastic glasses at center behind transparent plastic glasses at upper center?" }, { "from": "gpt", "value": "No, it is in front of transparent plastic glasses at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5ca40ad9d3436f1.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.413, 0.402) closer to viewer compared to point (0.621, 0.277)?" }, { "from": "gpt", "value": "Yes, point (0.413, 0.402) is in front of point (0.621, 0.277)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00113a6dc6c71b5e.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.905, 0.455) positioned before point (0.795, 0.702)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03532ee5fa904e8d.jpg", "conversations": [ { "from": "human", "value": "\nWhere is yellowtexturedlicense plate at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.777, 0.713)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1638d6680b1db1d7.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.127, 0.691)?" }, { "from": "gpt", "value": "silver metallic jacket at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf1a67850b077923.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between dark blue uniform at left and camera?" }, { "from": "gpt", "value": "They are 15.10 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e25aea84c1b9e3ea.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the black matte shirt at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.883, 0.680)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06bc5d7d158dcf2a.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the camera position. You want to take a photo of the blonde hair at center. How far should you move forward or backward to ensure the subject is in focus?" }, { "from": "gpt", "value": "The blonde hair at center and camera are 16.78 inches apart from each other. To ensure the subject is in focus, you should position yourself exactly 16.78 inches away from the blonde hair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9fa28ea70c998528.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of striped hoodie at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.459, 0.508)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0004b337ac5dcf87.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is green cotton t-shirt at center from pink fleece sweatshirt at center?" }, { "from": "gpt", "value": "They are 33.40 centimeters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1acf7327cc2b4d69.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the left, matte blue cap at left or gray fabric shirt at center?" }, { "from": "gpt", "value": "matte blue cap at left is more to the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/043c0c5692176463.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.478, 0.686)?" }, { "from": "gpt", "value": "shiny black jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1bbb908a599232a.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a white woven scarf at left. Pinpoint a point to the white woven scarf at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.172, 0.584)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4822a7071753177c.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between green water at lower center and camera." }, { "from": "gpt", "value": "green water at lower center is 39.73 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a66467de3f129cda.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the brown checkered suit at left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.246, 0.786)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/966e8aaf5fbf7b03.jpg", "conversations": [ { "from": "human", "value": "\nYou are an interior designer observing the room. You notice the gray cotton shirt at upper center and the yellow fabric at left. Which of these two items would require more space to store if you were to place them in a closet?" }, { "from": "gpt", "value": "The gray cotton shirt at upper center is bigger than the yellow fabric at left, so it would require more space to store in the closet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8931c145e02f239c.jpg", "conversations": [ { "from": "human", "value": "\nWhere is matte black sweater at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.433, 0.492)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/515ac27ce9d5c353.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the pink matte shirt at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.658, 0.542)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/520cd5d650669d44.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.080, 0.436) closer to camera compared to point (0.308, 0.077)?" }, { "from": "gpt", "value": "Yes, point (0.080, 0.436) is in front of point (0.308, 0.077)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c340f0c344906fc8.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.401, 0.592) behind point (0.977, 0.908)?" }, { "from": "gpt", "value": "Yes, it is behind point (0.977, 0.908)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd38c71ae6c14bbe.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the leather jacket at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.103, 0.784)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/674475f1d4915051.jpg", "conversations": [ { "from": "human", "value": "\nDoes wooden at center have a greater height compared to white glossy ferry at center?" }, { "from": "gpt", "value": "Incorrect, wooden at center's height is not larger of white glossy ferry at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b27972eafc71167.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.680, 0.847) or (0.130, 0.872)?" }, { "from": "gpt", "value": "Positioned in front is point (0.680, 0.847)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe26a23c018151f7.jpg", "conversations": [ { "from": "human", "value": "\nYou are a construction worker standing at the edge of the construction site. You need to pick up the white matte shovel at center to continue your work. However, you are currently holding the multicolored fabric shirt at center. Can you reach the shovel without letting go of the shirt?" }, { "from": "gpt", "value": "The multicolored fabric shirt at center and white matte shovel at center are 4.40 feet apart. Since the distance between them is greater than the typical arm length of a person, you cannot reach the shovel while holding the shirt." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70a06e8d2884d270.jpg", "conversations": [ { "from": "human", "value": "\nYou are driving a metallic blue car at center and want to know if you can see the smooth asphalt road at center clearly. Based on their positions, can you see the road ahead?" }, { "from": "gpt", "value": "The smooth asphalt road at center is closer to the viewer than the metallic blue car at center, so yes, you can see the road ahead clearly because it is nearer to you." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/262f302b80b4c785.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if shiny purple grapes at center is positioned to the right of green matte leaf at center?" }, { "from": "gpt", "value": "In fact, shiny purple grapes at center is to the left of green matte leaf at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/89346588e92feef5.jpg", "conversations": [ { "from": "human", "value": "\nPoint to transparent gelatinous at center.Point to the transparent gelatinous at center in the image." }, { "from": "gpt", "value": "[(0.506, 0.492)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0888fbfc42ff87ea.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is green water at lower center from camera?" }, { "from": "gpt", "value": "A distance of 33.45 meters exists between green water at lower center and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7972417711d6bcf.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the building and notice two fabrics in the scene. The dark fabric at center and the black fabric crowd at center. Which fabric is closer to you?" }, { "from": "gpt", "value": "The dark fabric at center is closer to the viewer than the black fabric crowd at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1661e6b87cfe68a1.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, green leafy willow at center or green grassy at lower center?" }, { "from": "gpt", "value": "Positioned higher is green leafy willow at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/507a3991bc46caa3.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a gray wool suit at right. Pinpoint a point to the gray wool suit at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.862, 0.680)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bfbf29358cf9d76e.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.746, 0.306) or point (0.593, 0.534)?" }, { "from": "gpt", "value": "The point (0.746, 0.306) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/468711456cd9d97d.jpg", "conversations": [ { "from": "human", "value": "\nIs brown wood pillar at center bigger than matte white stool at lower center?" }, { "from": "gpt", "value": "Actually, brown wood pillar at center might be smaller than matte white stool at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/574e2d3c8d8869f0.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the sculpture of a cow with scissors on its back. You notice a point marked at coordinates (0.460, 0.506). How far is this point from you?" }, { "from": "gpt", "value": "The point at (0.460, 0.506) is 11.76 feet away from the camera, so it is 11.76 feet away from you." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/61c073b5a2ca9858.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, metallic fountain at center or purple matte flower at center, stands taller?" }, { "from": "gpt", "value": "With more height is metallic fountain at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/827afc7916f4499f.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the pedestrian area of this urban scene. You want to take a photo of the white stone tower at left. How far are you from the tower?" }, { "from": "gpt", "value": "The white stone tower at left and viewer are 197.10 feet apart from each other, so you are 197.10 feet away from the tower." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b24bcfe33de1d0f.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.076, 0.222) or point (0.894, 0.509)?" }, { "from": "gpt", "value": "Point (0.894, 0.509)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc19e0c3cdcb7294.jpg", "conversations": [ { "from": "human", "value": "\nYou are a costume designer trying to create a replica of the outfits seen in the image. You need to decide which object from the scene requires more horizontal space when laying it out on a table. Which one is wider between the teal fabric pants at center and the metallic silver headband at center?" }, { "from": "gpt", "value": "The teal fabric pants at center is wider than the metallic silver headband at center, so the teal fabric pants at center would require more horizontal space when laying out on a table." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/576307d665ba032d.jpg", "conversations": [ { "from": "human", "value": "\nWhere is gold chain link necklace at upper right located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.746, 0.247)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7421dc4357cca82.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.345, 0.498) and camera." }, { "from": "gpt", "value": "A distance of 3.55 feet exists between point (0.345, 0.498) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92b89a78b007c0b5.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the sidewalk in front of the red brick building. You see the red matte awning at center and the metallic silver car at center. Which object is closer to you?" }, { "from": "gpt", "value": "The red matte awning at center is closer to you because it is further to the viewer than the metallic silver car at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/925d27686c9b8d24.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the orange cotton t-shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.350, 0.703)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/20d0a000698ac460.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the silky beige dress at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.225, 0.598)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7c410d720f81a15.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.839, 0.433) come in front of point (0.324, 0.531)?" }, { "from": "gpt", "value": "No, (0.839, 0.433) is further to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1fa0a6f2d0ed8533.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of silver metallic ladder at upper right? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.808, 0.753)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92bb8474603160c5.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the black satin suit at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.497, 0.673)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/508d2cdb40e1d7a9.jpg", "conversations": [ { "from": "human", "value": "\nWhere is smooth gray dolphin at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.701, 0.617)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/26ee3f02edcc333a.jpg", "conversations": [ { "from": "human", "value": "\nIs concrete textured rail at lower center taller than metallic silver boat at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c203d91a3c4ae26.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the white cotton t-shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.639, 0.606)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c46e473c6ed6bbae.jpg", "conversations": [ { "from": "human", "value": "\nYou are a gardener standing at the edge of the green reflective water at lower left, and you want to trim the branches of the green leafy willow at left. Can you reach the branches without moving from your current position?" }, { "from": "gpt", "value": "The green leafy willow at left is 9.17 meters away from the green reflective water at lower left. Since the distance is too far, you cannot reach the branches from your current position without moving closer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d819b26059ccfd1.jpg", "conversations": [ { "from": "human", "value": "\nDoes white textured bed at center appear on the left side of printed fabric shirt at left?" }, { "from": "gpt", "value": "Incorrect, white textured bed at center is not on the left side of printed fabric shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/109bb9b0696f2143.jpg", "conversations": [ { "from": "human", "value": "\nCould you provide the distance between matte black portrait at upper right and matte black chair at center?" }, { "from": "gpt", "value": "The distance of matte black portrait at upper right from matte black chair at center is 3.79 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3f3d70a2a3e76fc1.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of gray matte rhinoceros at center in the image." }, { "from": "gpt", "value": "[(0.638, 0.397)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5dc8c7c05d9553b3.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between shiny black monitor at center and camera." }, { "from": "gpt", "value": "51.09 centimeters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4d6abef1c47d053b.jpg", "conversations": [ { "from": "human", "value": "\nBetween green leafy tree at upper right and yellow matte flower at lower left, which one has more height?" }, { "from": "gpt", "value": "With more height is green leafy tree at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf3a70c589e3ef8d.jpg", "conversations": [ { "from": "human", "value": "\nIs red velvet curtain at center positioned before white glossy table at lower right?" }, { "from": "gpt", "value": "No, it is behind white glossy table at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/17bfc68b53f29553.jpg", "conversations": [ { "from": "human", "value": "\nDoes white fabric bed at center appear on the left side of white soft pillow at upper left?" }, { "from": "gpt", "value": "No, white fabric bed at center is not to the left of white soft pillow at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9864c61fca7fcdde.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.674, 0.525) and point (0.740, 0.714), which one is positioned in front?" }, { "from": "gpt", "value": "Positioned in front is point (0.674, 0.525)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e22bfbcb64d849b4.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in a junkyard filled with old electronics. You notice two points marked in the scene. From your perspective, which point is closer to you? The points are labeled as point 1 at coordinates point (0.271, 0.809) and point 2 at coordinates point (0.106, 0.278)." }, { "from": "gpt", "value": "Point 1 at coordinates point (0.271, 0.809) is closer to you because it is in front of point 2 at coordinates point (0.106, 0.278)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a1e6e23ccdbcc94.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.628, 0.925)?" }, { "from": "gpt", "value": "smooth asphalt road at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5bf058d6fe443996.jpg", "conversations": [ { "from": "human", "value": "\nHow close is point (0.408, 0.466) from camera?" }, { "from": "gpt", "value": "Point (0.408, 0.466) and camera are 8.85 feet apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f0a881a2b9210853.jpg", "conversations": [ { "from": "human", "value": "\nBetween black fabric at lower center and black plastic microphone at lower center, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "Positioned to the left is black fabric at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/68802b5a750a1c60.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.783, 0.698) come in front of point (0.869, 0.348)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b3923a2872993757.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, matte silver showerhead at upper center or brushed metal faucet at lower left?" }, { "from": "gpt", "value": "matte silver showerhead at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e9a36ddb003293f.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the matte red shirt at right? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.762, 0.631)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/259e32c7921c4159.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer aiming to capture the dancers in the center of the stage. You notice two skirts at the center, the shiny metallic skirt at center and the shiny orange fabric skirt at center. Which skirt should you focus on if you want to capture the larger one?" }, { "from": "gpt", "value": "The shiny orange fabric skirt at center is larger than the shiny metallic skirt at center, so you should focus on the shiny orange fabric skirt at center to capture the larger one." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/af0137083052b946.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance measurement between white paperboard at center and clear glass bottle at center?" }, { "from": "gpt", "value": "white paperboard at center is 7.04 inches away from clear glass bottle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b3561bd671ebcd85.jpg", "conversations": [ { "from": "human", "value": "\nIs green metallic sign at right shorter than green metallic sign at upper right?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2bad771d608ff9f1.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if wooden pole at center is thinner than yellow matte pole at center?" }, { "from": "gpt", "value": "No, wooden pole at center is not thinner than yellow matte pole at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5a8ebf58e826406.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, white metallic bus at center or matte black jacket at center, stands shorter?" }, { "from": "gpt", "value": "matte black jacket at center is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c8cc26d5071e692.jpg", "conversations": [ { "from": "human", "value": "\nYou are planning to plant a new tree in your backyard. The space you have is only suitable for plants that are smaller than the green grass at center. Can the green rough bark tree at center be planted there?" }, { "from": "gpt", "value": "The green rough bark tree at center has a larger size compared to green grass at center, so it cannot be planted in the space since it exceeds the size requirement." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a594f0243861cde1.jpg", "conversations": [ { "from": "human", "value": "\nYou are a bus driver and you need to locate two children for a safety check. The children are wearing a gray cotton shirt at right and a white matte shirt at center. Which child is positioned more to the right side of the bus?" }, { "from": "gpt", "value": "The gray cotton shirt at right is positioned more to the right side of the bus compared to the white matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f7d75879476ff88.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any stone fireplace at center in the image." }, { "from": "gpt", "value": "[(0.383, 0.759)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/65eca823d1fcb6c3.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any black stone figure at center in the image." }, { "from": "gpt", "value": "[(0.497, 0.512)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c29d8d1ce9d17dd.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.655, 0.694)?" }, { "from": "gpt", "value": "camouflage fabric hat at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c88aa2e5ca28766f.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person trying to determine if a tall package can fit between the teal matte shutters at center and the concrete at lower left. Which object is taller?" }, { "from": "gpt", "value": "The teal matte shutters at center is taller than the concrete at lower left, so the package can fit as long as its height does not exceed the height of the teal matte shutters at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/afac5a5eee7fe085.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the interview scene. You need to ensure both the striped fabric shirt at center and the black matte microphone at center are clearly visible in your photo. Given their sizes, which object might require you to adjust your camera focus more carefully to avoid blurriness?" }, { "from": "gpt", "value": "The striped fabric shirt at center has a smaller size compared to the black matte microphone at center, so you might need to adjust the camera focus more carefully on the striped fabric shirt at center to ensure its details are clear." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd654e8c41a80cea.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the smooth concrete wall at lower center and want to reach the beige stone windmill at center. In which direction should you move?" }, { "from": "gpt", "value": "You should move to the right to reach the beige stone windmill at center since it is located to the left of the smooth concrete wall at lower center, meaning the wall is to the right of the windmill. Wait, this seems contradictory. Let me think again. If the windmill is to the left of the wall, then from the wall, the windmill is to the left. So to reach it from the wall, you should move left. Hmm, maybe I got confused. Let me clarify. The description says the windmill is to the left of the wall. So if you," } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/90d4ee06c51f32a1.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the library and need to locate the matte black tablet at left. According to the coordinates provided, where exactly should you look?" }, { "from": "gpt", "value": "The matte black tablet at left is located at point coordinates (0.290, 0.470)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/633f8da59572110e.jpg", "conversations": [ { "from": "human", "value": "\nIs gray fleece jacket at center positioned at the back of yellow plastic toy car at lower center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e3ce2f4b4f0e7d0.jpg", "conversations": [ { "from": "human", "value": "\nLocate all green leafy tree at center in the image." }, { "from": "gpt", "value": "[(0.345, 0.192)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/798ddbe1295671e2.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker trying to locate the sign for Clear Creek Canyon. You see the green grassy hillside at center and the green textured tree at upper right. Which direction should you look to find the sign?" }, { "from": "gpt", "value": "The green grassy hillside at center is to the left of the green textured tree at upper right, so the sign is likely located to the left of the green textured tree at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b98e7e5be3d7b9dc.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, light beige stone bell tower at center or white matte boat at lower right?" }, { "from": "gpt", "value": "Positioned to the left is light beige stone bell tower at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e84d66f5b0cba75.jpg", "conversations": [ { "from": "human", "value": "\nYou are a maintenance worker needing to cross the metallic gray staircase at center to reach the other side of the railway tracks. However, there is a green leafy tree at center in the way. Can you pass through the space between them?" }, { "from": "gpt", "value": "The metallic gray staircase at center might be wider than green leafy tree at center, so there might be enough space to pass between them. However, since the exact width difference isn not specified, it is uncertain whether the space is sufficient for safe passage." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/367cbf01c5cd3a48.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.884, 0.784) and point (0.231, 0.688), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.884, 0.784) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eddfa73f76c0def1.jpg", "conversations": [ { "from": "human", "value": "\nYou are an art student who wants to take a photo of both the polished bronze reclining figure at center and the matte bronze statue at center in the same frame. Given that your camera has a maximum focal length of 50 meters, can you capture both subjects in a single shot without moving your position?" }, { "from": "gpt", "value": "The distance between the polished bronze reclining figure at center and the matte bronze statue at center is 22.78 meters. Since your camera can focus up to 50 meters, you can easily capture both subjects in one shot without moving." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/107998c0ff24b51e.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of white matte tower at left in the image." }, { "from": "gpt", "value": "[(0.278, 0.609)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e13486811f050ea3.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing a photoshoot and need to arrange the models in a straight line from left to right. Given the current positions of the matte red dress at left and the floral fabric blouse at center, where should the third model wearing a gray top be placed to maintain a balanced line?" }, { "from": "gpt", "value": "The third model wearing the gray top should be placed to the right of the floral fabric blouse at center to maintain a balanced line, as the matte red dress at left is already positioned to the left of the floral fabric blouse at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/acafa2ef91179425.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte purple sweater at center have a greater height compared to matte black hand at upper center?" }, { "from": "gpt", "value": "Correct, matte purple sweater at center is much taller as matte black hand at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ec5b12b53ecdba0.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.728, 0.711) come farther from viewer compared to point (0.937, 0.419)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0850bcdac48c1ee4.jpg", "conversations": [ { "from": "human", "value": "\nDoes light brown wooden bench at center have a lesser width compared to light brown fabric jacket at lower left?" }, { "from": "gpt", "value": "Indeed, light brown wooden bench at center has a lesser width compared to light brown fabric jacket at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f4818aded9e74617.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.728, 0.377) and point (0.202, 0.675), which one is positioned behind?" }, { "from": "gpt", "value": "Positioned behind is point (0.202, 0.675)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9a5f4bfa37564a2a.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue cotton sweater at right have a greater height compared to gray matte sweater at left?" }, { "from": "gpt", "value": "Incorrect, blue cotton sweater at right's height is not larger of gray matte sweater at left's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/adbb8449a8c866ab.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the matte green eye at upper left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.238, 0.453)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9e7e875ef06d93e7.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of patterned sweater at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.199, 0.606)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/beb456a53cf2a758.jpg", "conversations": [ { "from": "human", "value": "\nWhere is smooth concrete sidewalk at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.513, 0.894)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c211a6059d2e308.jpg", "conversations": [ { "from": "human", "value": "\nDoes orange cotton shirt at center have a lesser height compared to black matte microphone at center?" }, { "from": "gpt", "value": "In fact, orange cotton shirt at center may be taller than black matte microphone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7a40c50a1d09827.jpg", "conversations": [ { "from": "human", "value": "\nWhat is at (0.249, 0.341)?" }, { "from": "gpt", "value": "yellow velvet curtains at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1022a7c27baba195.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the silvery reflective water at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.508, 0.658)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9a87b10b780dd7e6.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the theater and want to know how far the point at coordinates point (0.812, 0.236) is from your current position. What is the distance?" }, { "from": "gpt", "value": "The point (0.812, 0.236) is 8.43 meters from the camera, so the distance from your current position is 8.43 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab55bd7f80026cbc.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.504, 0.659)?" }, { "from": "gpt", "value": "yellow weathered wood door at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9cd580a0bf890238.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of dark blue suit at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.854, 0.577)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82dffa644009b558.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer planning to take a photo of the white marble arch at center and the blue denim jeans at lower left. Which object should you focus on first if you want to capture both in a single frame without moving the camera?" }, { "from": "gpt", "value": "You should focus on the white marble arch at center first because it is larger in size than the blue denim jeans at lower left, so it will require more attention in the frame to ensure it is properly captured." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7f440e5f928a676a.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.636, 0.603) lie in front of point (0.931, 0.688)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c7127befcbfb6d2.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.000, 0.970) and point (0.902, 0.430), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.000, 0.970) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82d37ee4493f79d6.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the dark gray shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.293, 0.623)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3bdfe869e2dc9708.jpg", "conversations": [ { "from": "human", "value": "\nDoes white fabric pants at center have a smaller size compared to wooden at center?" }, { "from": "gpt", "value": "Incorrect, white fabric pants at center is not smaller in size than wooden at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1da8b08bd85f7cf5.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person who needs to place a package on the ground near the black cotton shirt at center. According to the image, where should you place the package in terms of coordinates?" }, { "from": "gpt", "value": "The package should be placed near the coordinates corresponding to the black cotton shirt at center, which is located at point (0.377, 0.581)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3ec2117eff917877.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.651, 0.792) and point (0.464, 0.448), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.464, 0.448) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/11c9e460edefd71e.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, green fabric banner at center or black matte clipboard at center?" }, { "from": "gpt", "value": "black matte clipboard at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d304bb58b10d0f66.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the matte gray dome at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.681, 0.541)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f0f73b13aa6efe67.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between black velvet robe at center and camera?" }, { "from": "gpt", "value": "The distance of black velvet robe at center from camera is 6.13 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5f2a4d9842b05bb0.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at center is positioned to the right of green grassy field at lower center?" }, { "from": "gpt", "value": "No, green leafy tree at center is not to the right of green grassy field at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c48fe32b8fa6475e.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a candid shot of the softball game. You need to ensure that both the purple matte helmet at center and the purple matte baseball uniform at center are in focus. Given that your camera can only focus on objects within a 10 meter range, will both subjects be in focus?" }, { "from": "gpt", "value": "The purple matte helmet at center and the purple matte baseball uniform at center are 9.97 meters apart from each other. Since the distance between them is within the 10 meter range of the camera, both subjects will be in focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/42c2c95fcdda26fd.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, gray concrete pavement at lower center or black metal parking rack at right?" }, { "from": "gpt", "value": "black metal parking rack at right is higher up." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e57508a2bb2751e.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the matte black bicycle handlebars at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.637, 0.808)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a24b5404037c44b.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between matte white beam at left and clear glass window at center." }, { "from": "gpt", "value": "A distance of 26.77 feet exists between matte white beam at left and clear glass window at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c42163b9f015b1a.jpg", "conversations": [ { "from": "human", "value": "\nIs striped fabric top at center below white cotton polo shirt at right?" }, { "from": "gpt", "value": "Yes, striped fabric top at center is below white cotton polo shirt at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b5eaa8b9498349f.jpg", "conversations": [ { "from": "human", "value": "\nYou are trying to decide which shirt to wear for an event. Both the dark gray shirt at center and the gray cotton shirt at upper center are options. Based on the image, which one is taller?" }, { "from": "gpt", "value": "The dark gray shirt at center is taller than the gray cotton shirt at upper center according to the image." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/efa9132b9ac3b7d0.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the brown wooden guitar at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.206, 0.562)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc0c906005bfcc0a.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the white frosty snow at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.868, 0.706)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eaaac5e78d5fd9a4.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.480, 0.780) or point (0.440, 0.444)?" }, { "from": "gpt", "value": "Point (0.480, 0.780) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4cf8569ddd477a0.jpg", "conversations": [ { "from": "human", "value": "\nDoes metallic gray railing at center have a greater height compared to silver metallic sedan at center?" }, { "from": "gpt", "value": "Correct, metallic gray railing at center is much taller as silver metallic sedan at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/127b2493a9ac8b08.jpg", "conversations": [ { "from": "human", "value": "\nPoint to white plastic drawer at lower center.Point to the white plastic drawer at lower center in the image." }, { "from": "gpt", "value": "[(0.304, 0.911)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02157642a0aaf3bb.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from point (0.260, 0.519) to camera." }, { "from": "gpt", "value": "A distance of 810.21 feet exists between point (0.260, 0.519) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03be88187ae1c273.jpg", "conversations": [ { "from": "human", "value": "\nYou are designing a garden layout and need to place a new decorative stone path. The path must be placed between the green grass at center and the green leafy plant at lower left. Which object should the path be closer to if it needs to accommodate a wider base?" }, { "from": "gpt", "value": "The path should be closer to the green grass at center because its width surpasses that of the green leafy plant at lower left, allowing more space for the wider base." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f69182206cdf8e61.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up for a group photo in the park. You notice the green striped dress at right and the white cotton shirt at left. Which clothing item should you position lower in your camera frame to ensure both are visible?" }, { "from": "gpt", "value": "The green striped dress at right is below the white cotton shirt at left, so you should position the green striped dress at right lower in the frame to ensure both are visible." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1419c34123614007.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between green glossy eye at center and camera?" }, { "from": "gpt", "value": "They are 24.13 centimeters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b363ca6c29186d1.jpg", "conversations": [ { "from": "human", "value": "\nPoint to white striped shirt at center.Point to the white striped shirt at center in the image." }, { "from": "gpt", "value": "[(0.878, 0.683)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bfad952a6762b81b.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between high-visibility orange safety vest at left and striped shirt at center." }, { "from": "gpt", "value": "high-visibility orange safety vest at left is 1.44 meters away from striped shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9dee37c6e855128.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.612, 0.345) closer to camera compared to point (0.750, 0.314)?" }, { "from": "gpt", "value": "No, (0.612, 0.345) is behind (0.750, 0.314)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f8b2bd84079e7063.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a smooth concrete sidewalk at center. Pinpoint a point to the smooth concrete sidewalk at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.566, 0.820)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a4b1793ac7ff93a.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.503, 0.875)?" }, { "from": "gpt", "value": "brown dirt track at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b103c03d58c9fc0.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, black plastic video camera at left or fuzzy beige coat at upper left?" }, { "from": "gpt", "value": "With more height is fuzzy beige coat at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d444383db02feeb3.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.309, 0.959) or point (0.243, 0.542)?" }, { "from": "gpt", "value": "Positioned in front is point (0.309, 0.959)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/896ac20bd3f1c9fe.jpg", "conversations": [ { "from": "human", "value": "\nIs dark blue jeans at center further to camera compared to dark brown leather jacket at lower center?" }, { "from": "gpt", "value": "Yes, dark blue jeans at center is further from the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/886a4da449d64057.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from matte green bag at lower left to camera." }, { "from": "gpt", "value": "matte green bag at lower left is 11.50 feet from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d945b6a2058f7e3a.jpg", "conversations": [ { "from": "human", "value": "\nIs brown leather sandal at lower left further to camera compared to brown leather sandal at lower center?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49c43f0c82dcd5b4.jpg", "conversations": [ { "from": "human", "value": "\nHow close is point (0.519, 0.591) from camera?" }, { "from": "gpt", "value": "A distance of 42.02 feet exists between point (0.519, 0.591) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29667c36986aa387.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the dining area and want to hand a napkin to the person wearing the green matte shirt at center. How far do you need to reach to place the napkin directly in front of them?" }, { "from": "gpt", "value": "The green matte shirt at center is 1.74 meters away from you, so you need to reach 1.74 meters to place the napkin directly in front of them." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ae3cc5bbfdb6a0ea.jpg", "conversations": [ { "from": "human", "value": "\nHow far apart are green leafy tree at upper center and brown soil at lower center?" }, { "from": "gpt", "value": "green leafy tree at upper center and brown soil at lower center are 12.62 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5846453041439228.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown wooden dock at center come behind blue cotton shirt at center?" }, { "from": "gpt", "value": "No, brown wooden dock at center is in front of blue cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3cb29c30d44b15fe.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing a small event and need to place a decorative item on the table. The black matte jacket at lower right and the silver metallic microphone at upper right are both candidates. Which one takes up more space on the table?" }, { "from": "gpt", "value": "The black matte jacket at lower right is larger in size than the silver metallic microphone at upper right, so it takes up more space on the table." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/35e5a31a7d656784.jpg", "conversations": [ { "from": "human", "value": "\nBetween tan uniform at center and green matte t-shirt at left, which one has less height?" }, { "from": "gpt", "value": "With less height is tan uniform at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7024962d6b6a1f2d.jpg", "conversations": [ { "from": "human", "value": "\nIs white glossy motorcycle at center thinner than white matte shirt at center?" }, { "from": "gpt", "value": "No, white glossy motorcycle at center is not thinner than white matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34f6acf97880a13a.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.834, 0.494) and point (0.580, 0.227), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.834, 0.494)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7848e8773bf00400.jpg", "conversations": [ { "from": "human", "value": "\nBetween green silk saree at left and black sequined dress at center, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "Positioned to the left is green silk saree at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/91bc4b79e608a8ba.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the showroom and want to take a photo of the satin blue car at center. The camera you are using has a focal length of 50mm and you are positioned at point A. The car is located at point B. If the coordinates of point A are given as x1,y1 and point B as x2,y2, what is the distance between you and the car in meters? Assume the showroom is a standard 10m x 10m space." }, { "from": "gpt", "value": "The coordinates of the satin blue car at center are provided as point B at (0.910, 0.259). However, without knowing the exact coordinates of point A where you are standing, it is impossible to calculate the distance between you and the car. Please provide the coordinates of point A to proceed with the calculation." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c1a31553140644e.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.568, 0.530) closer to viewer compared to point (0.584, 0.388)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e7a92edec7040314.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.881, 0.567) and point (0.003, 0.275), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.881, 0.567) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2b8378a2daf17b9.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of blue suit at right more distant than that of pink satin blouse at center?" }, { "from": "gpt", "value": "No, blue suit at right is in front of pink satin blouse at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/baa7ad7cffb4f1e7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark blue suit at left is positioned above brown patterned tie at left?" }, { "from": "gpt", "value": "Correct, dark blue suit at left is located above brown patterned tie at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/af55936d4dfcbeae.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.586, 0.816) come farther from viewer compared to point (0.815, 0.533)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e72bc9c5270f6b71.jpg", "conversations": [ { "from": "human", "value": "\nHow far is point (0.654, 0.614) from the camera?" }, { "from": "gpt", "value": "Point (0.654, 0.614) is 72.93 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f6fc6b9c01d652d.jpg", "conversations": [ { "from": "human", "value": "\nPoint to blue woolen coat at right.Point to the blue woolen coat at right in the image." }, { "from": "gpt", "value": "[(0.758, 0.531)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16aa49c23ec5c219.jpg", "conversations": [ { "from": "human", "value": "\nDoes marble column at left appear on the right side of white marble bust at left?" }, { "from": "gpt", "value": "Correct, you'll find marble column at left to the right of white marble bust at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9405bd580cd908c4.jpg", "conversations": [ { "from": "human", "value": "\nIs transparent water at lower center to the right of white matte boat at lower right from the viewer's perspective?" }, { "from": "gpt", "value": "Incorrect, transparent water at lower center is not on the right side of white matte boat at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7acd6696908e953a.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the workshop and need to hand a document to the person in the beige soft sweater at center without disturbing the person in the blue fabric shirt at left. Which direction should you approach from?" }, { "from": "gpt", "value": "The beige soft sweater at center is positioned under the blue fabric shirt at left, so you should approach from the right side to avoid the blue fabric shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/84d6beecf6a60f34.jpg", "conversations": [ { "from": "human", "value": "\nIs blue fleece jacket at center to the left of light blue cotton shirt at right from the viewer's perspective?" }, { "from": "gpt", "value": "Yes, blue fleece jacket at center is to the left of light blue cotton shirt at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1769a90675a9e2a.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.017, 0.670) come farther from viewer compared to point (0.325, 0.844)?" }, { "from": "gpt", "value": "Yes, it is behind point (0.325, 0.844)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4b5bfeee27c11e24.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black notebook at center further to camera compared to yellow creamy food at center?" }, { "from": "gpt", "value": "No, matte black notebook at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06495eb3e0cf8b66.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any gray wool jacket at upper left in the image." }, { "from": "gpt", "value": "[(0.120, 0.234)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd5cad99821cd902.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.127, 0.464) and camera." }, { "from": "gpt", "value": "Point (0.127, 0.464) is 108.94 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1de20815fb89e355.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from green leafy tree at center to green leafy trees at center." }, { "from": "gpt", "value": "285.51 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ad9dae2a05e4f53e.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of wooden paddle at center in the image." }, { "from": "gpt", "value": "[(0.808, 0.775)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/15a3139f4bd1dc8d.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, gray cotton shirt at center or striped shirt at center?" }, { "from": "gpt", "value": "striped shirt at center is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/353ef2ed14f6c811.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a light gray sleeveless top at center. Pinpoint a point to the light gray sleeveless top at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.440, 0.564)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d56a53f048b23ccc.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the white glossy boat at upper center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.727, 0.241)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c6aded03d1df19b2.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of white matte polo shirt at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.808, 0.239)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca584e166704c1bc.jpg", "conversations": [ { "from": "human", "value": "\nYou are a customer in the Mi Mi Lotus cafe and want to place a large tray between the wooden shelves at upper center and the black chalkboard at upper right. Considering their widths, will the tray fit horizontally between them?" }, { "from": "gpt", "value": "The wooden shelves at upper center are wider than the black chalkboard at upper right. Since the tray needs to fit horizontally between them, the total space available between the two objects would depend on their combined widths. However, without knowing the exact distance between them or the tray size, it is impossible to determine if it will fit. Please check the actual space or measure both objects." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dee7a44da86491ec.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of gray striped sweater at center in the image." }, { "from": "gpt", "value": "[(0.199, 0.289)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c268d533d8745288.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.673, 0.391) and point (0.332, 0.747), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.332, 0.747) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f0b219c34af8afd6.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of antique brass trumpet at right less distant than that of black matte toy car at lower center?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd1f9085b28c226f.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.390, 0.573) positioned in front of point (0.984, 0.545)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/48d4b41a4bd32a77.jpg", "conversations": [ { "from": "human", "value": "\nBetween rubberized red slide at lower right and white matte/soft fabric at center, which one has less height?" }, { "from": "gpt", "value": "Standing shorter between the two is rubberized red slide at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a9b9e0702963f4e.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, shiny yellow convertible at center or silver metallic convertible at center?" }, { "from": "gpt", "value": "Positioned to the left is shiny yellow convertible at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ad3228544faccff.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, light blue cotton shirt at center or white cotton shirt at center, stands taller?" }, { "from": "gpt", "value": "light blue cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c602c3b25bc137dc.jpg", "conversations": [ { "from": "human", "value": "\nHow close is point (0.377, 0.556) from camera?" }, { "from": "gpt", "value": "Point (0.377, 0.556) is 25.74 feet away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/51b49552fa37ba9b.jpg", "conversations": [ { "from": "human", "value": "\nBetween white glossy statue at center and white fabric at lower center, which one has more height?" }, { "from": "gpt", "value": "white glossy statue at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/afff69b2e0474555.jpg", "conversations": [ { "from": "human", "value": "\nWhat does the point at coordinates (0.658, 0.639) indicate in the image?" }, { "from": "gpt", "value": "The point at coordinates (0.658, 0.639) marks the location of the brown stone tower at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/652941f12f2cd58c.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of green matte tank top at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.461, 0.809)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c0b6e3ff5ace0277.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is green leafy palm tree at lower left from green leafy palm tree at center-left?" }, { "from": "gpt", "value": "The distance of green leafy palm tree at lower left from green leafy palm tree at center-left is 16.84 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7adcece40186812f.jpg", "conversations": [ { "from": "human", "value": "\nDoes white cotton t-shirt at center have a greater width compared to teal sweater at center?" }, { "from": "gpt", "value": "Yes, white cotton t-shirt at center is wider than teal sweater at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/96d560ac3080c7d7.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.199, 0.392) or point (0.877, 0.677)?" }, { "from": "gpt", "value": "The point (0.877, 0.677) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/afb06808ed5aa517.jpg", "conversations": [ { "from": "human", "value": "\nBased on the scene described, which object is positioned to the right when observing the rusty metal bridge at center and green leafy shrubs at center?" }, { "from": "gpt", "value": "The rusty metal bridge at center is positioned to the right of the green leafy shrubs at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/72ada929f1b4e036.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.833, 0.150) closer to viewer compared to point (0.284, 0.573)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.284, 0.573)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e4c457c6bba97d0a.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the historic town square and want to take a photo of both the clock tower and the Jo Pub sign. You notice two points marked on the ground at coordinates point (0.839, 0.673) and point (0.713, 0.323). Which point should you stand at to ensure both landmarks are visible in your photo without any obstructions?" }, { "from": "gpt", "value": "You should stand at point (0.713, 0.323) because point (0.839, 0.673) is in front of it, meaning standing at the latter would place you closer to the buildings and potentially block the view of the clock tower or Jo Pub sign. The point (0.713, 0.323) offers a better vantage point further back to capture both landmarks without obstruction." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8e51f5c92448991.jpg", "conversations": [ { "from": "human", "value": "\nIs dark gray t-shirt at center to the right of black plastic table at center from the viewer's perspective?" }, { "from": "gpt", "value": "Yes, dark gray t-shirt at center is to the right of black plastic table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3699a7327b46fc68.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of dirt road at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.488, 0.784)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/669f8496a5fc83e6.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the white jersey at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.523, 0.567)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c3b647143007c2f0.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the white matte vest at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.600, 0.681)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4b39e451b061513e.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and want to reach the point marked as point (0.906, 0.619). How far do you need to walk?" }, { "from": "gpt", "value": "You need to walk 4.68 meters to reach point (0.906, 0.619) from the camera position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1adc21eb3ca5bf68.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.638, 0.562) from camera?" }, { "from": "gpt", "value": "A distance of 1.01 meters exists between point (0.638, 0.562) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db4f26be8830f47b.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.787, 0.738) and point (0.564, 0.756), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.787, 0.738) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/74ef1ca72eac1786.jpg", "conversations": [ { "from": "human", "value": "\nIs white wood chair at center to the right of black cotton shirt at left from the viewer's perspective?" }, { "from": "gpt", "value": "Indeed, white wood chair at center is positioned on the right side of black cotton shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b132a0f71f0e13d9.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the brown wooden deck at center and want to step onto the green grass at lower center. Is the distance between them short enough for you to step comfortably?" }, { "from": "gpt", "value": "The distance between the green grass at lower center and brown wooden deck at center is 3.76 feet. Since a comfortable stepping distance for an average person is typically around 2 to 3 feet, stepping might be a bit challenging but possible with caution." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f671430db31b2b6d.jpg", "conversations": [ { "from": "human", "value": "\nLocate blue glossy sports car at center in the image." }, { "from": "gpt", "value": "[(0.647, 0.527)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a64dda9370bc876.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.647, 0.716) from camera?" }, { "from": "gpt", "value": "Point (0.647, 0.716) is 151.86 feet away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2cef9f58b11a4e84.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass at center behind shiny black dog at center?" }, { "from": "gpt", "value": "No, it is in front of shiny black dog at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7673fd413b889dc9.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the white printed shirt at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.758, 0.508)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3376df158b0e7262.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte jacket at left smaller than pink matte jacket at center?" }, { "from": "gpt", "value": "Actually, black matte jacket at left might be larger than pink matte jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ec5fd40a0cb02ba.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.465, 0.698) come closer to viewer compared to point (0.105, 0.208)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a638a7f9e9bfc64.jpg", "conversations": [ { "from": "human", "value": "\nYou are a bird flying over the garden scene. You want to land on the tallest object between the rusty stone lion at lower left and the green leafy palm tree at upper center. Which object should you choose?" }, { "from": "gpt", "value": "The green leafy palm tree at upper center is taller than the rusty stone lion at lower left, so you should land on the green leafy palm tree at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/214b2b6452bac00e.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the snowy landscape and want to reach both the point at coordinates point(0.367, 0.864) and point(0.288, 0.391). Which point will you reach first as you move forward?" }, { "from": "gpt", "value": "You will reach point(0.367, 0.864) first because it is closer to you than point(0.288, 0.391)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60a21810cb83c6d6.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.441, 0.930) or point (0.350, 0.416)?" }, { "from": "gpt", "value": "Positioned in front is point (0.441, 0.930)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b767c79e2d04372.jpg", "conversations": [ { "from": "human", "value": "\nYou are trying to decide where to place the brown leather armchair at right and the white plastic robotic vacuum cleaner at center in the room. Which object has a smaller width?" }, { "from": "gpt", "value": "The brown leather armchair at right is thinner than the white plastic robotic vacuum cleaner at center, so the brown leather armchair at right has a smaller width." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/615fbb0a72460c38.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if bare branches at center is shorter than bare branches at upper center?" }, { "from": "gpt", "value": "Indeed, bare branches at center has a lesser height compared to bare branches at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea9e382873d95971.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green leafy tree at upper left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.210, 0.386)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ba7384df57aa22c.jpg", "conversations": [ { "from": "human", "value": "\nIs brown matte shirt at upper left bigger than plaid cotton shirt at center?" }, { "from": "gpt", "value": "Correct, brown matte shirt at upper left is larger in size than plaid cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f70a68911c9b3f0a.jpg", "conversations": [ { "from": "human", "value": "\nHow distant is black matte jacket at center from matte gray jacket at center?" }, { "from": "gpt", "value": "black matte jacket at center is 5.62 meters away from matte gray jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d76c741f00fd2c46.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of smooth skin face at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.532, 0.536)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/40a407648f3c0b3e.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing in the urban scene. You want to capture a photo of the glassy steel tower at center without any people blocking it. Is the light blue sweater at center in a position that would block your view of the tower?" }, { "from": "gpt", "value": "The glassy steel tower at center is positioned over the light blue sweater at center, so the light blue sweater at center is directly in front of the tower. This means the sweater would block your view of the tower unless you move to a different angle or position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c3d50e7bcd36715.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if red matte t-shirt at center is shorter than blue cotton polo shirt at left?" }, { "from": "gpt", "value": "Correct, red matte t-shirt at center is not as tall as blue cotton polo shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/50466a3a48643e09.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.929, 0.662) less distant than point (0.567, 0.831)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.567, 0.831)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4131638cd9a0ed81.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up a camera at the back of the garden. You want to ensure both the green checkered suit at center and the blue checkered dress at center are fully visible in the photo. Which individual should you position closer to the camera to avoid one blocking the other?" }, { "from": "gpt", "value": "The green checkered suit at center is much taller than the blue checkered dress at center, so you should position the blue checkered dress at center closer to the camera to prevent the taller green checkered suit at center from blocking it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c5bec711cd1cc92.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and want to reach the point marked at coordinates point (0.185, 0.716). How far do you need to walk to get there?" }, { "from": "gpt", "value": "The point marked at coordinates point (0.185, 0.716) is 3.65 feet away from the camera, so you need to walk 3.65 feet to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/592126710907e20c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, blue fabric jacket at center or dark blue fabric at center, stands shorter?" }, { "from": "gpt", "value": "dark blue fabric at center is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c1b79dd77f282e0b.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.298, 0.863) come in front of point (0.067, 0.706)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1dc790231f9ba47a.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer planning to capture the grand building with both the green leafy tree at lower left and the green leafy tree at lower center in the frame. Which tree should you position closer to the edge of the frame to maintain balance?" }, { "from": "gpt", "value": "You should position the green leafy tree at lower left closer to the edge of the frame because it has a lesser width compared to the green leafy tree at lower center, helping to balance the composition." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d226062ed8e8047.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a closeup of the panda in the center. You notice two points in the image labeled as point 1 at coordinates point (0.128, 0.786) and point 2 at coordinates point (0.230, 0.625). Which point is closer to your camera lens?" }, { "from": "gpt", "value": "Point (0.128, 0.786) is closer to the camera lens than point (0.230, 0.625) because it is further to the camera than the other point." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a705cc1eaff3b2ed.jpg", "conversations": [ { "from": "human", "value": "\nIs light wood table at center behind matte plastic banner at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/43c326f41852b092.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the edge of the urban square and want to place your matte black backpack at center on the ground. The square has a maximum weight capacity of 50 kg per square meter. Can you confirm if the location at point 0.859, 0.663 is within the safe load limit?" }, { "from": "gpt", "value": "The matte black backpack at center is located at point (0.663, 0.859), but the square has a maximum weight capacity of 50 kg per square meter. Without knowing the weight of the backpack or the area it will occupy, it is impossible to determine if it exceeds the safe load limit." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e6f8cca9ad027a3d.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the left, matte black t-shirt at center or white lace dress at center?" }, { "from": "gpt", "value": "matte black t-shirt at center is more to the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/145033a26ddfaf05.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.294, 0.603) or point (0.754, 0.780)?" }, { "from": "gpt", "value": "Point (0.294, 0.603)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/944e81671b31c222.jpg", "conversations": [ { "from": "human", "value": "\nIs brown dry grass at center shorter than bare wood tree at upper right?" }, { "from": "gpt", "value": "No, brown dry grass at center is not shorter than bare wood tree at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/47a0dadfade9ce4d.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to orange glass bottle at left? Please provide its 2D coordinates.Where can I find orange glass bottle at left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.231, 0.502)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b102037838054a83.jpg", "conversations": [ { "from": "human", "value": "\nBased on the scene description, can you determine the relative position of the white frothy water at center and the gray rock at left? Please explain using the given information." }, { "from": "gpt", "value": "The white frothy water at center is above the gray rock at left according to the description provided." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4548228a34b1bbc0.jpg", "conversations": [ { "from": "human", "value": "\nWhere is marble tower at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.243, 0.556)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3eeff2eff3cd6465.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is curly hair at center from camera?" }, { "from": "gpt", "value": "curly hair at center is 1.04 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3abc9a9585e0feee.jpg", "conversations": [ { "from": "human", "value": "\nHow close is wooden stained bass at center from strawmaterial/texturehat at upper right?" }, { "from": "gpt", "value": "25.61 inches" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e01c4e038c9d861.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the center of the scene. You want to take a photo that includes both the point at point (0.408, 0.573) and the point at point (0.334, 0.456). Based on their positions, which point should you focus on first to ensure both are in frame?" }, { "from": "gpt", "value": "You should focus on point (0.334, 0.456) first because it is behind point (0.408, 0.573), so starting with the farther point ensures both are within the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/96d2d0a2997c68aa.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the garage and want to determine which of the two points, point (0.450, 0.580) or point (0.431, 0.497), is closer to you. Based on their positions in the image, which one would you say is nearer?" }, { "from": "gpt", "value": "Point (0.450, 0.580) is further to the camera than point (0.431, 0.497), so the closer point to you is point (0.431, 0.497)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b26bc069b3cf5ffa.jpg", "conversations": [ { "from": "human", "value": "\nWhat is at (0.949, 0.589)?" }, { "from": "gpt", "value": "green leafy plant at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06afbf84cfc45c63.jpg", "conversations": [ { "from": "human", "value": "\nIs leather at center smaller than wooden desk at center?" }, { "from": "gpt", "value": "Incorrect, leather at center is not smaller in size than wooden desk at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/feadc17a5fc071ca.jpg", "conversations": [ { "from": "human", "value": "\nYou are a pedestrian standing at the entrance of the mosque. You want to walk to the light blue fabric at center without stepping on the shiny dark brown car at lower right. Which direction should you walk to avoid it?" }, { "from": "gpt", "value": "The shiny dark brown car at lower right is positioned on the left side of light blue fabric at center. To avoid stepping on it, you should walk to the right side of the light blue fabric at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/246dd6ecac4c0659.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.528, 0.487) positioned after point (0.830, 0.631)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/784412476984bb2e.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and want to reach the point marked as point (0.147, 0.619) in the scene. How far do you need to walk to get there?" }, { "from": "gpt", "value": "The distance of point (0.147, 0.619) from camera is 3.92 meters, so you need to walk 3.92 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d519073c7c108d48.jpg", "conversations": [ { "from": "human", "value": "\nLocate the black fabric tank top at lower right in the image." }, { "from": "gpt", "value": "[(0.839, 0.830)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/59f0b7da0bcd5e2b.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.321, 0.467) come closer to viewer compared to point (0.643, 0.192)?" }, { "from": "gpt", "value": "Yes, point (0.321, 0.467) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03565dfeeacd5ffc.jpg", "conversations": [ { "from": "human", "value": "\nWhere is the white matte table at center located in the image?" }, { "from": "gpt", "value": "The white matte table at center is located at point (0.305, 0.820)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b08f82466293f46b.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.718, 0.555) farther from camera compared to point (0.071, 0.655)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0fd74c6802a1ba5c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white matte truck at center is bigger than brown fur cow at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd144a52ac58e991.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.848, 0.839) or (0.960, 0.539)?" }, { "from": "gpt", "value": "Positioned behind is point (0.960, 0.539)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ad2a5a979aeca1eb.jpg", "conversations": [ { "from": "human", "value": "\nDoes orange reflective vest at center appear over orange reflective safety vest at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2edbb5bd649f4114.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.318, 0.898)?" }, { "from": "gpt", "value": "white matte shirt at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4eddf8b7b12ff4be.jpg", "conversations": [ { "from": "human", "value": "\nPoint to yellow stone church at center.Point to the yellow stone church at center in the image." }, { "from": "gpt", "value": "[(0.474, 0.544)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f4d4c2308edab50e.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of dark gray sweater at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.625, 0.631)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b5260af3d714b60.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.545, 0.281)?" }, { "from": "gpt", "value": "golden stone minaret at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5edc263c3c5ed422.jpg", "conversations": [ { "from": "human", "value": "\nYou are attending a meeting in this room and need to hand a document to both the camouflage uniform at center and the dark gray suit at center. In what order should you approach them from your current position at the entrance door located to the right of the televisions?" }, { "from": "gpt", "value": "You should approach the camouflage uniform at center first because they are positioned to the left of the dark gray suit at center, making them closer to your entrance point on the right side of the televisions." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/771430449cdce0dd.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.770, 0.895) come behind point (0.500, 0.716)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a162fc34dd5625dc.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.960, 0.034) come closer to viewer compared to point (0.122, 0.270)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/39eff5508110027b.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer positioned at the front of the stage. You need to take a photo that includes both the leather jacket at lower right and the microphone holder. Can you fit both in your camera frame if your field of view is limited to the bottom half of the stage?" }, { "from": "gpt", "value": "The leather jacket at lower right is located at point (0.984, 0.820). Since the photographer is at the front and the field of view is limited to the bottom half of the stage, both the leather jacket at lower right and the microphone holder should be within the frame as they are positioned in the lower section of the stage." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f7a9f91bfffd5bc.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, wooden-handled knife at right or polished silver fork at left?" }, { "from": "gpt", "value": "polished silver fork at left is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/26c114259e3ffb1d.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the center of the stage and want to move to the orange cotton shirt at lower left. Which direction should you move to reach it?" }, { "from": "gpt", "value": "The orange cotton shirt at lower left is located at point 0.536 in the x coordinate and 0.321 in the y coordinate. Since you are at the center of the stage, moving towards the lower left direction will lead you to the orange cotton shirt at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/459ab6786b7069ab.jpg", "conversations": [ { "from": "human", "value": "\nIs matte silver golf cart at center wider than black and white striped zebra at center?" }, { "from": "gpt", "value": "No, matte silver golf cart at center is not wider than black and white striped zebra at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed210fb13e1b7027.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.957, 0.522)?" }, { "from": "gpt", "value": "smooth concrete harbor at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b0a7bff4494bcfe.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.341, 0.772) or (0.911, 0.391)?" }, { "from": "gpt", "value": "Positioned in front is point (0.341, 0.772)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b3a29e80297ca2ac.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.336, 0.436) behind point (0.758, 0.675)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7c6ecf4970a9a811.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black wire cage at left is bigger than black and white fur cat at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e6b5066070b7ac39.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a group photo of the blue checkered shirt at center and the satin pink blouse at center. Since you want to ensure both are clearly visible, which one should you focus on first to account for their sizes?" }, { "from": "gpt", "value": "The blue checkered shirt at center is bigger than the satin pink blouse at center, so you should focus on the blue checkered shirt at center first as it occupies more space in the frame, ensuring it is in focus before adjusting for the smaller satin pink blouse at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4c7f28e6435a5146.jpg", "conversations": [ { "from": "human", "value": "\nWhere is white matte mannequin at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.252, 0.609)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/197336ccbe71c889.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of yellow plastic tape at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.813, 0.214)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88144dbb0270af3e.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the edge of the lake and want to reach the point marked as point (0.473, 0.414). Based on the description, how far is this point from your current position?" }, { "from": "gpt", "value": "The point (0.473, 0.414) is 393.48 meters away from the viewer, so you are 393.48 meters away from the point." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/91baf77b05db69f6.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, matte brown face at center or teethwhitetooth at center?" }, { "from": "gpt", "value": "teethwhitetooth at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f6951a9fec557b4.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of brown fabric chair at center from camera?" }, { "from": "gpt", "value": "3.65 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f9d436477a260744.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between brown textured bark at left and light brown fur at center." }, { "from": "gpt", "value": "4.43 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d333e581569eb5a2.jpg", "conversations": [ { "from": "human", "value": "\nYou are a visitor walking on the gray stone path at center in a traditional Chinese garden. You want to place a small souvenir on the gray stone railing at center. Can you do this without needing to climb up? Explain why based on their heights." }, { "from": "gpt", "value": "The gray stone path at center has a lesser height compared to the gray stone railing at center. Since the railing is taller than the path, you would need to climb up slightly to place the souvenir on the railing." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4c28a83977627b7f.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, white matte ferry at center or clear water at lower center?" }, { "from": "gpt", "value": "white matte ferry at center is higher up." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d109636a6ae2a5f.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker who wants to take a photo of the white matte flower at center while avoiding the green leafy tree at upper center blocking the view. Which direction should you move to ensure the tree is out of the frame?" }, { "from": "gpt", "value": "The green leafy tree at upper center is above the white matte flower at center, so moving downward or to the side away from the tree would position the flower in the foreground without the tree obstructing the view." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a452d9738da50bde.jpg", "conversations": [ { "from": "human", "value": "\nIs bare branches at upper center thinner than green mossy statue at lower right?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1765ab74e5fe5f3a.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.373, 0.791) and point (0.600, 0.831), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.600, 0.831)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9a2ea11d257903b9.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of dark gray suit at center from camera?" }, { "from": "gpt", "value": "dark gray suit at center is 2.72 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/775cdf70397f0eaf.jpg", "conversations": [ { "from": "human", "value": "\nBetween yellow matte leopard at lower left and matte brown monkey at upper left, which one has less height?" }, { "from": "gpt", "value": "With less height is matte brown monkey at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1acd3adc07899b54.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.710, 0.584) and point (0.567, 0.275), which one is positioned behind?" }, { "from": "gpt", "value": "Point (0.567, 0.275)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/211327feb19e9ce6.jpg", "conversations": [ { "from": "human", "value": "\nIs brown woolen scarf at center below brown woven scarf at center?" }, { "from": "gpt", "value": "Yes, brown woolen scarf at center is below brown woven scarf at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e898f53a4b38836.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the gray cobblestone pavement at center and want to reach the red matte bicycle at right. How far do you need to walk?" }, { "from": "gpt", "value": "The gray cobblestone pavement at center is 7.12 feet away from the red matte bicycle at right, so you need to walk 7.12 feet to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a64805cbf319cc97.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, gray matte shirt at center or black plastic chair at center, stands taller?" }, { "from": "gpt", "value": "Standing taller between the two is gray matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4aa95f643a88c24b.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing a superhero costume parade and need to arrange the black matte suit at center and the leather jacket at right in a line. Which costume should be placed first if you want the wider costume to be on the left side?" }, { "from": "gpt", "value": "The black matte suit at center should be placed first on the left side because it is wider than the leather jacket at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/770d23a60fd2f933.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, matte plastic pasta at center or white glossy plate at center, stands shorter?" }, { "from": "gpt", "value": "Standing shorter between the two is white glossy plate at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0db53e39cb116bbe.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person who needs to place a package that is 4 feet wide between the patchwork fabric bed at center and the gray cotton shirt at lower left. Can you fit the package between them without moving either object?" }, { "from": "gpt", "value": "The distance between the patchwork fabric bed at center and the gray cotton shirt at lower left is 4.01 feet. Since the package is 4 feet wide, it can fit between them as there is enough space." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0c64538bd6594e63.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the hardcover books at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.708, 0.312)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/97fdc09d9f592d61.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of dark blue suit at right? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.875, 0.572)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a6254cf8cf282901.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of white cotton tank top at upper center?" }, { "from": "gpt", "value": "A distance of 32.37 feet exists between white cotton tank top at upper center and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02333ea43e8552ff.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, orange fleece jacket at center or yellow matte bananas at upper right?" }, { "from": "gpt", "value": "With less height is yellow matte bananas at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b04a5c9de2bf20a.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any smooth wooden floor at center in the image." }, { "from": "gpt", "value": "[(0.471, 0.842)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5ec590c00d18c1be.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of matte pink tank top at center in the image." }, { "from": "gpt", "value": "[(0.518, 0.495)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b30458b4e761d36.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to pink fabric dress at center? Please provide its 2D coordinates.Where can I find pink fabric dress at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.254, 0.625)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f4961a85cbe7347b.jpg", "conversations": [ { "from": "human", "value": "\nHow close is point (0.887, 0.730) from camera?" }, { "from": "gpt", "value": "Point (0.887, 0.730) and camera are 12.41 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/18af00dcb127c9f0.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the bridge walkway and see the green leafy water at center and the dark hair person at center in the scene. Which object is positioned to the right of the other?" }, { "from": "gpt", "value": "The green leafy water at center is to the right of dark hair person at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2abec3df2dcc9a3b.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, fluffy pink coat at center or fluffy pink jacket at center?" }, { "from": "gpt", "value": "fluffy pink jacket at center is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef7c1578bcb4771b.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.266, 0.417) or (0.570, 0.242)?" }, { "from": "gpt", "value": "Positioned behind is point (0.570, 0.242)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6730c377ee50075f.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, black suit at left or clear plastic water bottles at lower center, stands shorter?" }, { "from": "gpt", "value": "clear plastic water bottles at lower center is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1c4192d088feeb7.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of rugged brown rock at upper center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.401, 0.552)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b80f19eef90f1356.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.589, 0.388) or (0.694, 0.970)?" }, { "from": "gpt", "value": "Positioned behind is point (0.589, 0.388)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/32ddd4f7e4ee47df.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked as point (0.294, 0.530) in the image. How far are you from the camera?" }, { "from": "gpt", "value": "The distance of point (0.294, 0.530) from camera is 4.15 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f451e256ea9acd89.jpg", "conversations": [ { "from": "human", "value": "\nHow far apart are green stone river at center and green textured trees at upper center?" }, { "from": "gpt", "value": "They are 109.03 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f587e4aac68b8b66.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of brown rough bark tree at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.641, 0.500)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37faa2a8be0f28c9.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the same position as the person in the image and want to determine which of the two points, point (0.267, 0.705) or point (0.882, 0.528), is closer to you. Based on the scene, which point is nearer?" }, { "from": "gpt", "value": "Point (0.267, 0.705) is closer to the viewer than point (0.882, 0.528)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/333cc4478fbdd657.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between blue water at center and camera." }, { "from": "gpt", "value": "The distance of blue water at center from camera is 20.89 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e9fbe1b6dd26b34.jpg", "conversations": [ { "from": "human", "value": "\nDoes silver metallic pole at left come behind metallic pole at right?" }, { "from": "gpt", "value": "No, silver metallic pole at left is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/108eabba040f2da9.jpg", "conversations": [ { "from": "human", "value": "\nIs black wood fence at left bigger than light brown antelope at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c55345118c23dafc.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, green grass at lower left or dark gray t-shirt at left, stands taller?" }, { "from": "gpt", "value": "dark gray t-shirt at left is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea54eb014941be31.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.702, 0.764) lie behind point (0.336, 0.853)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4e5a1bc024ee8db7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown gravel beach at lower left is thinner than brown gravelly sand at center?" }, { "from": "gpt", "value": "Incorrect, brown gravel beach at lower left's width is not less than brown gravelly sand at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e9dbbff410b639c.jpg", "conversations": [ { "from": "human", "value": "\nDoes shiny red keyboard at center have a larger size compared to blue fabric flag at upper right?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c374056a0e12476.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if floral-patterned fabric bag at left is positioned to the right of maroon woolen blazer at center?" }, { "from": "gpt", "value": "In fact, floral-patterned fabric bag at left is to the left of maroon woolen blazer at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/312a1bf188c56167.jpg", "conversations": [ { "from": "human", "value": "\nPoint to clear water at center.Point to the clear water at center in the image." }, { "from": "gpt", "value": "[(0.657, 0.716)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b86f77c839fbd2df.jpg", "conversations": [ { "from": "human", "value": "\nDoes satin wood table at center have a lesser height compared to blue cotton shirt at upper center?" }, { "from": "gpt", "value": "Correct, satin wood table at center is not as tall as blue cotton shirt at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f3b7b3dd38ecef7.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte red dress at center have a larger size compared to purple cotton shorts at center?" }, { "from": "gpt", "value": "Correct, matte red dress at center is larger in size than purple cotton shorts at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37165c140f2ed1d0.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between green bamboo at center and camera?" }, { "from": "gpt", "value": "The distance of green bamboo at center from camera is 23.21 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3efe3b16784b99de.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, transparent glass door at upper right or matte skin hand at center?" }, { "from": "gpt", "value": "transparent glass door at upper right is below." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2151c19a1ab4a675.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.416, 0.831) or point (0.244, 0.316)?" }, { "from": "gpt", "value": "Point (0.416, 0.831)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec6d766fc29ef227.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, black matte shirt at center or matte blue shirt at upper left?" }, { "from": "gpt", "value": "black matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3985bd481a307406.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a blue printed shirt at left. Pinpoint a point to the blue printed shirt at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.182, 0.550)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/041fc67a5009c94c.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the golden crispy fried chicken at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.775, 0.791)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8ac95256c49e766.jpg", "conversations": [ { "from": "human", "value": "\nWhere is white matte water at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.075, 0.697)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e07bd12ab175d61.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, white matte banjo at left or wooden violin at right?" }, { "from": "gpt", "value": "With more height is wooden violin at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c9a2cacf51a8867.jpg", "conversations": [ { "from": "human", "value": "\nIs green matte broccoli at center positioned behind green matte tree at left?" }, { "from": "gpt", "value": "Yes, green matte broccoli at center is further from the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed506ba2a7cb8c0a.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of white fabric crowd at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.168, 0.225)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1dd61c8edea5013.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if metallic podium at center is smaller than yellow striped dress shirt at center?" }, { "from": "gpt", "value": "Incorrect, metallic podium at center is not smaller in size than yellow striped dress shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d09dd97ea3d30230.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, matte white plush at lower right or white glossy paw at lower left?" }, { "from": "gpt", "value": "matte white plush at lower right is higher up." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f8d31ff49c2fb4f8.jpg", "conversations": [ { "from": "human", "value": "\nCould you measure the distance between blue fabric boat at lower right and satin black car at center?" }, { "from": "gpt", "value": "15.23 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/101a57c7ff86e47d.jpg", "conversations": [ { "from": "human", "value": "\nYou are a person sitting in the pink fabric armchair at lower left. You want to hand a toy to someone standing in front of you. Is the distance between you and the person in front of you sufficient to reach them?" }, { "from": "gpt", "value": "The distance between the pink fabric armchair at lower left and the viewer is 38.80 inches, so yes, the person can reach them since the distance is within typical arm reach." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/57b3667b98e7fde8.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.280, 0.453) positioned behind point (0.726, 0.677)?" }, { "from": "gpt", "value": "No, (0.280, 0.453) is in front of (0.726, 0.677)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5203eb0e616e4ea0.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, pastel blue plastic birdcage at right or matte plastic cash register at left, stands taller?" }, { "from": "gpt", "value": "pastel blue plastic birdcage at right is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/080258a88530deeb.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, green matte christmas tree at center or green artificial christmas tree at left?" }, { "from": "gpt", "value": "Standing shorter between the two is green artificial christmas tree at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c9e50a8b2def415.jpg", "conversations": [ { "from": "human", "value": "\nYou are a botanist examining the natural scene. You notice the green mossy bark at center. Can you determine its exact position in the image using coordinates?" }, { "from": "gpt", "value": "The green mossy bark at center is located at point coordinates of (0.551, 0.841)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/799df7a68a4d4208.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue water at lower center is wider than tie-dye fabric dress at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/42ac027e68f9d06e.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the green matte glass jar at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.403, 0.369)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b868ddecd2b0ff8.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.261, 0.362) lie behind point (0.349, 0.572)?" }, { "from": "gpt", "value": "No, (0.261, 0.362) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/90a8efbac9207b40.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the white textured building at right? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.907, 0.480)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/11f8131da2c79e24.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.414, 0.081) or point (0.735, 0.473)?" }, { "from": "gpt", "value": "The point (0.735, 0.473) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5616e612fdf3240f.jpg", "conversations": [ { "from": "human", "value": "\nDoes white textured hair at center appear over matte black dress at center?" }, { "from": "gpt", "value": "Incorrect, white textured hair at center is not positioned above matte black dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a12977d66c97b674.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, tortoiseshell sunglasses at upper left or stone tower at upper center?" }, { "from": "gpt", "value": "Positioned to the left is stone tower at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5f69b800561518c0.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray wool suit at right is wider than satin blue blazer at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/970ee640cd9acd20.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray matte deer at center is bigger than brown fur antelope at center?" }, { "from": "gpt", "value": "Incorrect, gray matte deer at center is not larger than brown fur antelope at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c3b829ad9fccb8de.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and want to reach the point marked as point (0.843, 0.856) in the image. How far do you need to walk to get there?" }, { "from": "gpt", "value": "The distance of point (0.843, 0.856) from the camera is 49.66 meters, so you need to walk 49.66 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5722424bd798c64.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, brown muddy water at lower center or matte gray hippo at center, stands shorter?" }, { "from": "gpt", "value": "matte gray hippo at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/97736ca6e95440b0.jpg", "conversations": [ { "from": "human", "value": "\nWhere is white glass window at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.708, 0.406)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a798edcc5db2d93f.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.209, 0.514) and camera." }, { "from": "gpt", "value": "Point (0.209, 0.514) is 6.35 feet away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f95257bdf88d010.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.453, 0.373) or (0.396, 0.280)?" }, { "from": "gpt", "value": "The point (0.396, 0.280) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2cdb5b3ca39affbd.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.444, 0.650)?" }, { "from": "gpt", "value": "white paper sign at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6873e43ee00ac785.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the large concrete archway with graffiti and see two points marked in the scene. The first point is at coordinates point (0.756, 0.667) and the second is at point (0.212, 0.483). Which point is closer to you?" }, { "from": "gpt", "value": "Point (0.756, 0.667) is further to the viewer than point (0.212, 0.483), so the second point is closer to you." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/17ed3f2c5fc10198.jpg", "conversations": [ { "from": "human", "value": "\nWhere is dark wood portrait at upper center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.371, 0.077)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/174d21f6966d2ac1.jpg", "conversations": [ { "from": "human", "value": "\nYou are a visitor approaching the entrance of the East Asian architectural structure. You see the white stone path at center and the white stone pillar at center. Which object is closer to the entrance?" }, { "from": "gpt", "value": "The white stone path at center is located below the white stone pillar at center, so the path is closer to the entrance than the pillar." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/18979b2901f0ded1.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up a shot of the scene described. You want to place a light to the left of the matte black sweater at left and another light to the right of the blue fabric chair at center. Will the two lights be aligned horizontally or vertically?" }, { "from": "gpt", "value": "The matte black sweater at left is positioned on the left side of the blue fabric chair at center, so placing a light to the left of the matte black sweater at left and another to the right of the blue fabric chair at center would result in the two lights being aligned horizontally." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/998ec2f1ec4defad.jpg", "conversations": [ { "from": "human", "value": "\nDoes white asphalt at center appear on the left side of white matte tank top at center?" }, { "from": "gpt", "value": "Incorrect, white asphalt at center is not on the left side of white matte tank top at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a62784201599190.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.845, 0.491) or point (0.925, 0.008)?" }, { "from": "gpt", "value": "Point (0.845, 0.491)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00899a2155440435.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the metallic blue cart at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.881, 0.770)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60de01fefd2b8533.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.074, 0.714) lie in front of point (0.347, 0.819)?" }, { "from": "gpt", "value": "No, (0.074, 0.714) is behind (0.347, 0.819)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/30f1f55cd7234f19.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, striped cotton shirt at left or matte black shirt at center?" }, { "from": "gpt", "value": "matte black shirt at center is higher up." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/811ea9d7c18a4fb8.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker carrying a 30 feet long rope. You spot the green mossy rocks at center and the clear water at center in the scene. Can you safely use your rope to cross the gap between them?" }, { "from": "gpt", "value": "The distance between the green mossy rocks at center and the clear water at center is 29.79 feet. Since your rope is 30 feet long, it is just long enough to safely cross the gap between them." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4ea04a7793e6979d.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of plaid fabric shirt at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.834, 0.859)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b888e05817e962e4.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.682, 0.370) lie in front of point (0.376, 0.598)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/12946c43c4a708be.jpg", "conversations": [ { "from": "human", "value": "\nLocate all white matte table at center in the image." }, { "from": "gpt", "value": "[(0.461, 0.648)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/097851e8e91f0034.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between white matte radiator at lower center and camera." }, { "from": "gpt", "value": "white matte radiator at lower center is 4.10 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05ff0c0d556b3514.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the event and want to capture both the light beige skirt at center and the brown textured coat at center in the same frame. Which object should you focus on first to ensure both are in the shot?" }, { "from": "gpt", "value": "You should focus on the brown textured coat at center first because the light beige skirt at center is positioned under it, so adjusting the camera angle to include the lower area where the skirt is located will naturally include the coat above." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ed369a9a534883a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if fuzzy beige knit cap at upper right is taller than white puffy coat at center?" }, { "from": "gpt", "value": "Indeed, fuzzy beige knit cap at upper right has a greater height compared to white puffy coat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf112fffe34dfca5.jpg", "conversations": [ { "from": "human", "value": "\nPoint to green leafy tree at center.Point to the green leafy tree at center in the image." }, { "from": "gpt", "value": "[(0.500, 0.306)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/11c70ae2252e3c59.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.615, 0.511) positioned behind point (0.985, 0.603)?" }, { "from": "gpt", "value": "No, (0.615, 0.511) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9991b03d5ff75503.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of bronze statue at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.498, 0.588)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3cc3cf2d2f0bbea7.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, matte pink shirt at center or blue woven hat at center?" }, { "from": "gpt", "value": "Positioned to the right is blue woven hat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ffac1af3c3a268ea.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if translucent glass pillar at center is positioned above rusty metal chair at center?" }, { "from": "gpt", "value": "No, translucent glass pillar at center is not above rusty metal chair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bcc6f139f6bb2e83.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.767, 0.284) and point (0.640, 0.961), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.767, 0.284) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/599c9e57fa47bdb7.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a matte gray train at center. Pinpoint a point to the matte gray train at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.788, 0.581)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a257164df9107367.jpg", "conversations": [ { "from": "human", "value": "\nYou are a pedestrian standing at the crosswalk and want to take a photo of both the shiny silver sedan at right and the metallic silver car at center. Which car should you look down at to include both in your shot?" }, { "from": "gpt", "value": "To include both the shiny silver sedan at right and the metallic silver car at center in your photo, you should look down at the shiny silver sedan at right since it is located below the metallic silver car at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2157aa30ffb44e38.jpg", "conversations": [ { "from": "human", "value": "\nHow far is point (0.333, 0.867) from the camera?" }, { "from": "gpt", "value": "They are 3.73 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e4d3edcdffb49bb4.jpg", "conversations": [ { "from": "human", "value": "\nPoint to brown/dry wood tree at left.Point to the brown/dry wood tree at left in the image." }, { "from": "gpt", "value": "[(0.153, 0.527)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a3c94f9c5d893fd.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.230, 0.127) or (0.509, 0.892)?" }, { "from": "gpt", "value": "Point (0.230, 0.127)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d46bd7006a27f847.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between matte ceramic mug at center and camera?" }, { "from": "gpt", "value": "matte ceramic mug at center and camera are 13.65 inches apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed84d64c24970467.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.201, 0.358)?" }, { "from": "gpt", "value": "brown leather suitcase at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29dd8478da7e58cf.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the edge of the court, wanting to capture both the black matte shirt at center and the white matte shirt at center in a single shot. Your camera has a maximum focal length that allows a 10 feet wide field of view. Can you fit both subjects within the frame without moving closer?" }, { "from": "gpt", "value": "The distance between the black matte shirt at center and white matte shirt at center is 8.46 feet, which is less than the camera field of view of 10 feet. Therefore, you can fit both subjects within the frame without moving closer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/53e2d1a810794fdc.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.106, 0.198) or point (0.343, 0.355)?" }, { "from": "gpt", "value": "Positioned behind is point (0.343, 0.355)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0048f11fc5b63d5f.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of metallic silver car at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.738, 0.383)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d4832c1b0f06689.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.199, 0.534) and camera." }, { "from": "gpt", "value": "Point (0.199, 0.534) is 4.84 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fecbbe7a4c6d30fd.jpg", "conversations": [ { "from": "human", "value": "\nDoes green plastic cucumbers at left appear on the right side of ripe red tomato at upper right?" }, { "from": "gpt", "value": "In fact, green plastic cucumbers at left is to the left of ripe red tomato at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4768631716d9b10.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the white matte uniform at lower center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.817, 0.869)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e2a350887599048b.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of black fur cat at center from camera?" }, { "from": "gpt", "value": "A distance of 13.88 meters exists between black fur cat at center and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e8d3a92c0b0211f.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, black fabric at lower left or blue floral dress at lower right?" }, { "from": "gpt", "value": "black fabric at lower left is higher up." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ee457cf07f65f5d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray cotton shirt at lower right is wider than white glossy shell at center?" }, { "from": "gpt", "value": "Indeed, gray cotton shirt at lower right has a greater width compared to white glossy shell at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e78f481e53e6ea9a.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of multicolored paper cutouts at upper left. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.200, 0.186)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/24666e22ebfca6f5.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the wooden walkway and see two people wearing a matte black coat at center and a red fabric jacket at center. Which person is standing closer to the ground?" }, { "from": "gpt", "value": "The matte black coat at center is located below the red fabric jacket at center, so the person wearing the matte black coat at center is standing closer to the ground." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f815007d760d135.jpg", "conversations": [ { "from": "human", "value": "\nYou are a guest staying in this rustic room and want to place your phone on the closest object to the window. The objects available are the white soft bed at right and the white soft pillow at center. Which object should you choose?" }, { "from": "gpt", "value": "The white soft pillow at center is closer to the window than the white soft bed at right, so you should place your phone on the white soft pillow at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8429f38dfbe50c37.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between purple fabric jacket at upper right and matte white cup at center." }, { "from": "gpt", "value": "They are 21.09 inches apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c652d91cea418535.jpg", "conversations": [ { "from": "human", "value": "\nLocate the white matte shutters at center in the image." }, { "from": "gpt", "value": "[(0.352, 0.377)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b60036b09848d16.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.782, 0.516) or point (0.428, 0.344)?" }, { "from": "gpt", "value": "The point (0.428, 0.344) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e6169a45c65dab10.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the two people in the image. Which point, point (0.409, 0.655) or point (0.713, 0.380), is closer to you?" }, { "from": "gpt", "value": "Point (0.409, 0.655) is closer to you because it is in front of point (0.713, 0.380)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e4080446a44f018e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray concrete pavement at center is bigger than matte black suit at left?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dbbb10fa22f6ff65.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.844, 0.744) farther from camera compared to point (0.294, 0.705)?" }, { "from": "gpt", "value": "Yes, point (0.844, 0.744) is farther from viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bde0bd754b36647b.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.199, 0.706) and point (0.614, 0.817), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.614, 0.817)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5fcef7f7e48c69c2.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, translucent glass beer bottle at left or yellow mashed potato at center?" }, { "from": "gpt", "value": "yellow mashed potato at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a496b15e0d48c37.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between white plastic boat at center and camera." }, { "from": "gpt", "value": "white plastic boat at center is 101.71 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/971d295561f0a6cc.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of cloudy gray sky at upper center?" }, { "from": "gpt", "value": "A distance of 1026.52 feet exists between cloudy gray sky at upper center and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02c10d28734afb7d.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.223, 0.984) or point (0.866, 0.338)?" }, { "from": "gpt", "value": "The point (0.223, 0.984) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ee7c95f995ebb26b.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the center of the room and want to hand a document to the person wearing the dark gray vest at center. Based on their position, which direction should you move to reach them?" }, { "from": "gpt", "value": "The dark gray vest at center is located at point (0.748, 0.675), so you should move towards the lower right direction from the center to reach them." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/585101a1e7ae5d84.jpg", "conversations": [ { "from": "human", "value": "\nYou are an attendee at this presentation. You notice the white paper at upper center and the dark gray suit at left. Which object is positioned higher in the image?" }, { "from": "gpt", "value": "The white paper at upper center is positioned higher than the dark gray suit at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d68e2ff39b360cf.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow reflective vest at left below orange reflective traffic cone at lower right?" }, { "from": "gpt", "value": "No, yellow reflective vest at left is not below orange reflective traffic cone at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c8f4f15a71c5829.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position looking at the scene. There is a point marked at coordinates point (0.979, 0.936). How far is that point from your current position?" }, { "from": "gpt", "value": "The point (0.979, 0.936) is 57.12 meters away from the camera position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/602c8c9f45189d0e.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of shiny red snowmobile at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.624, 0.845)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06c293fd29a0a7e9.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between black matte hoodie at upper left and camera?" }, { "from": "gpt", "value": "black matte hoodie at upper left and camera are 9.43 feet apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/800b893e55f02612.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.656, 0.919) less distant than point (0.737, 0.398)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.737, 0.398)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e3001263254a1f97.jpg", "conversations": [ { "from": "human", "value": "\nWhat is at (0.633, 0.248)?" }, { "from": "gpt", "value": "khaki fabric bag at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7b5084703db7f30.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the white fur cat at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.699, 0.463)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f95ac72efb2671bd.jpg", "conversations": [ { "from": "human", "value": "\nBetween blue water at center and gray asphalt highway at lower center, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "From the viewer's perspective, gray asphalt highway at lower center appears more on the left side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e618736d8ecfd7d5.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.223, 0.495) and point (0.176, 0.591), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.223, 0.495) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/594b206798137f34.jpg", "conversations": [ { "from": "human", "value": "\nYou are a zookeeper observing the alpacas. You need to separate them into two different feeding areas. The white fluffy alpaca at left must be moved to the left feeding area, and the fuzzy brown alpaca at upper center must be moved to the right feeding area. Based on their current positions, which alpaca is closer to its designated feeding area?" }, { "from": "gpt", "value": "The white fluffy alpaca at left is already positioned to the left, so it is closer to the left feeding area. The fuzzy brown alpaca at upper center is to the right of the white one, meaning it is closer to the right feeding area." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b304cc5b75b568e8.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, velvet red couch at lower left or floral fabric pillow at center?" }, { "from": "gpt", "value": "floral fabric pillow at center is above." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95c77b9577492975.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of gray rocky mountain at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.575, 0.303)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4603164f92e54f08.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is wooden walkway at center from silver metallic rail at center?" }, { "from": "gpt", "value": "wooden walkway at center is 13.99 feet from silver metallic rail at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/016c08a4d7640724.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the green leafy coconut tree at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.584, 0.353)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/065ecb6c16cba469.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, striped cotton shirt at lower right or black rubber skateboard at center?" }, { "from": "gpt", "value": "black rubber skateboard at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1174addb05a46ebf.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the black fabric camera at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.377, 0.561)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/941afd87ca54f820.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between navy blue polo shirt at left and textured gray shirt at center." }, { "from": "gpt", "value": "The distance of navy blue polo shirt at left from textured gray shirt at center is 24.84 inches." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f4d0f58c1ae64e7.jpg", "conversations": [ { "from": "human", "value": "\nBetween white glossy cruise ship at upper right and metallic silver van at center, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "Positioned to the left is metallic silver van at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d7b43e2bc55b360.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.048, 0.797) in front of point (0.060, 0.675)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.060, 0.675)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f2aba466fb6f8735.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the right, camouflagetextured fabricarmy uniform at center-right or soft pink rose at lower left?" }, { "from": "gpt", "value": "camouflagetextured fabricarmy uniform at center-right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/073b7cb65f4d8ad4.jpg", "conversations": [ { "from": "human", "value": "\nYou are taking a photo of the person in the scene. You want to focus on the point at point (0.239, 0.767) and point (0.688, 0.244). Which point should you focus on first to ensure both are in focus?" }, { "from": "gpt", "value": "Point (0.239, 0.767) is closer to the camera than point (0.688, 0.244), so you should focus on point (0.239, 0.767) first to ensure both are in focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1609ad705f34d540.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.045, 0.842) positioned before point (0.716, 0.397)?" }, { "from": "gpt", "value": "Yes, point (0.045, 0.842) is in front of point (0.716, 0.397)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/849a848117cf4161.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between tan leather jacket at center and camera." }, { "from": "gpt", "value": "tan leather jacket at center and camera are 32.86 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0bc33253a1ac846c.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the dark brown wooden barge at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.509, 0.631)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c248d0ed539cf427.jpg", "conversations": [ { "from": "human", "value": "\nBetween smooth black hair at right and light brown silky hair at center, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "Positioned to the right is smooth black hair at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/999e0bdd68109616.jpg", "conversations": [ { "from": "human", "value": "\nYou are an observer looking at the seascape. You notice the silhouette skin at upper right and the silky white sail at center. Which object is positioned higher in the image?" }, { "from": "gpt", "value": "The silhouette skin at upper right is positioned higher in the image than the silky white sail at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07c99dd58578f41b.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker navigating through the forest and want to identify the smaller tree between the green leafy tree at center and the green rough bark tree at center. Which one should you look for?" }, { "from": "gpt", "value": "The green leafy tree at center occupies less space than the green rough bark tree at center, so you should look for the green leafy tree at center as it is the smaller one." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9a97299f60ed8668.jpg", "conversations": [ { "from": "human", "value": "\nWhere is bare branches tree at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.242, 0.397)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/22356ec4da25e3ca.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the stop sign on the right side of the railway track. Looking towards the tracks, you notice two points marked in the scene. Which of the two points, point (0.442, 0.703) or point (0.914, 0.817), is closer to your current position?" }, { "from": "gpt", "value": "Point (0.914, 0.817) is closer to your current position because it is in front of point (0.442, 0.703) according to the description." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5f5a01c160ba8e0d.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the navy blue hoodie at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.381, 0.648)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/acb0dbef5a7c8401.jpg", "conversations": [ { "from": "human", "value": "\nLocate teal wooden door at right in the image." }, { "from": "gpt", "value": "[(0.810, 0.458)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d350280523f5bb01.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the conference room and want to find the matte black suit at left. According to the coordinates provided, where should you look?" }, { "from": "gpt", "value": "The matte black suit at left is located at the 2D coordinates point (0.209, 0.509)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b78e5c390f17e09.jpg", "conversations": [ { "from": "human", "value": "\nDoes striped shirt at center come behind silver metallic laptop at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc55b0062bf32c16.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker standing at the base of the scene. You want to walk from the weathered wood fence at center to the green grassy hill at upper center. Which direction should you move to reach the hill?" }, { "from": "gpt", "value": "You should move upward from the weathered wood fence at center towards the green grassy hill at upper center since the hill is located above the fence and further away from the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aa36a74905539a92.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker carrying a heavy backpack and notice two paths in the forest. One is the brown textured dirt path at center and the other is the brown gravel path at center. Which path should you take if you want to walk on the upper layer?" }, { "from": "gpt", "value": "You should take the brown textured dirt path at center because it is above the brown gravel path at center, making it the upper layer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e164addf04784d40.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if purple glossy race car at center is positioned to the right of striped fabric pants at lower left?" }, { "from": "gpt", "value": "Indeed, purple glossy race car at center is positioned on the right side of striped fabric pants at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/27d81b4a000a8511.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a white paper sign at upper center. Pinpoint a point to the white paper sign at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.444, 0.120)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a06c1acc59b1418f.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of white cotton shirt at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.825, 0.642)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e2cc62a89336d7c7.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, green fabric shirt at center or hardcover book at center?" }, { "from": "gpt", "value": "green fabric shirt at center is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d303404368a65ebc.jpg", "conversations": [ { "from": "human", "value": "\nDescribe the object at (0.352, 0.439)." }, { "from": "gpt", "value": "brown muddy water at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a0fcaa2cbec37f78.jpg", "conversations": [ { "from": "human", "value": "\nYou are a drone operator trying to capture a clear image of the white paper banner at center from your position near the dark hair at center. Given that your drone can fly up to 15 meters, will it be able to reach the banner?" }, { "from": "gpt", "value": "The dark hair at center is 14.80 meters from the white paper banner at center. Since the drone can fly up to 15 meters, it will be able to reach the banner as 14.80 meters is within the drone" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7c5f93a8fc11fc6.jpg", "conversations": [ { "from": "human", "value": "\nBetween silver metallic tripod at right and red fabric cap at upper center, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "Positioned to the right is red fabric cap at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1772e7c666043ef3.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, black satin suit at center or dark gray suit at center, stands shorter?" }, { "from": "gpt", "value": "Standing shorter between the two is dark gray suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a01f26ee3bc88a7b.jpg", "conversations": [ { "from": "human", "value": "\nHow close is brown polished stone effigy at lower center from camera?" }, { "from": "gpt", "value": "They are 26.16 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/09f564c809fc86ee.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the metallic gray frame at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.739, 0.209)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/50755a818f62c706.jpg", "conversations": [ { "from": "human", "value": "\nWhere is matte black jacket at upper center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.387, 0.147)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5cc8ccfcd6996348.jpg", "conversations": [ { "from": "human", "value": "\nYou are a drone operator trying to capture a photo of the group in the camping scene. The drone is currently hovering at point coordinates of 0.5, 0.5. To get the best shot, you need to adjust the drone to the same position as the green grass at center. What coordinates should you set the drone to?" }, { "from": "gpt", "value": "The green grass at center is located at position coordinates of (0.068, 0.745). Therefore, to align the drone with the green grass at center for the best shot, you should set the drone to those coordinates." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36203c506ab292a0.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.150, 0.177) less distant than point (0.982, 0.198)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/71d58c4e0cd34c73.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in a park and see the denim jacket at center and the green grass at lower center. Which object is closer to you?" }, { "from": "gpt", "value": "The denim jacket at center is closer to you than the green grass at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/72a87814c5fa54d9.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte red shirt at left is bigger than yellow rubber tube at center?" }, { "from": "gpt", "value": "Correct, matte red shirt at left is larger in size than yellow rubber tube at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc50cffafd550845.jpg", "conversations": [ { "from": "human", "value": "\nIs pink satin dress at center wider than matte denim overalls at left?" }, { "from": "gpt", "value": "Incorrect, pink satin dress at center's width does not surpass matte denim overalls at left's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5ade6a4c3da8bd03.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of white feathered bird at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.543, 0.647)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d7bcd62931ca1a6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white paper sign at upper left is smaller than matte orange poster at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5ad7e4ba6b2faf5b.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of black matte scuba gear at upper center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.749, 0.242)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/10a6d8b5dc2b0e88.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the purple silk scarf at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.722, 0.594)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7f63ce2aaf738d7.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray rough rock at upper center have a greater width compared to gray rock at center?" }, { "from": "gpt", "value": "Yes, gray rough rock at upper center is wider than gray rock at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd11a5d43bbf8fae.jpg", "conversations": [ { "from": "human", "value": "\nDoes reddish-brown stone bridge at center have a greater width compared to brown stone bridge at center?" }, { "from": "gpt", "value": "Incorrect, reddish-brown stone bridge at center's width does not surpass brown stone bridge at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fda4415d72e7a8d1.jpg", "conversations": [ { "from": "human", "value": "\nYou are a parent trying to choose between two jackets for your child. You see the matte brown jacket at upper left and the brown fleece jacket at upper left in the image. Which jacket is closer to the slide?" }, { "from": "gpt", "value": "The matte brown jacket at upper left is closer to the slide because it is only 4.08 inches away from the brown fleece jacket at upper left, but since both are at the upper left, their positions relative to the slide depend on their placement. However, the description only provides the distance between them, not their distance from the slide. Therefore, we cannot determine which is closer based on the given information." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73ed9432c1659186.jpg", "conversations": [ { "from": "human", "value": "\nYou are part of a photography team capturing the event. You need to position a camera to ensure both the matte black suit at center and the light gray suit at center are visible in the frame. Given their positions, which one should you focus on first to include both in the shot?" }, { "from": "gpt", "value": "The matte black suit at center is located below the light gray suit at center. To include both in the frame, focus on the light gray suit at center first as it is higher up, allowing the camera to capture the lower positioned matte black suit at center in the same shot." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f798bd07064a84e2.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the mall and see a green wool coat at left and a matte black jacket at center. Which one is closer to the entrance of the mall?" }, { "from": "gpt", "value": "The green wool coat at left is closer to the entrance of the mall because it is positioned to the left of the matte black jacket at center, which implies it is nearer to the entrance based on their spatial arrangement." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7af51fa939c1a12d.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of light brown wooden signpost at left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.028, 0.356)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3dddd9877570da45.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the conference hall and notice two points marked in the scene. The first point is at coordinate point (0.492, 0.695) and the second is at point (0.873, 0.639). Which point is closer to you?" }, { "from": "gpt", "value": "Point (0.492, 0.695) is closer to you because it is further to the viewer than point (0.873, 0.639)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92e5d81136eca95f.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.955, 0.406) come in front of point (0.800, 0.566)?" }, { "from": "gpt", "value": "No, it is behind (0.800, 0.566)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49f712afbf9da485.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.687, 0.928) from camera?" }, { "from": "gpt", "value": "They are 26.96 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0ace49643656afd.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a photo of both the white matte sweater at center and the matte red jacket at center in the image. Since you want to highlight both equally, which object should you adjust your focus to prioritize in terms of size to make them appear balanced in the final shot?" }, { "from": "gpt", "value": "The white matte sweater at center occupies less space than the matte red jacket at center. To balance their sizes in the photo, you should focus more on enlarging the white matte sweater at center or reducing the size of the matte red jacket at center in the composition." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/939ee6d15568c8ca.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery robot that needs to place a small package at point (0.410, 0.736). The package is 10 inches in diameter. Can you safely place it there without hitting any objects?" }, { "from": "gpt", "value": "The distance between point (0.410, 0.736) and the camera is 23.35 inches. Since the package is only 10 inches in diameter, there is enough space to place it safely without hitting any objects." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cae3483663461edd.jpg", "conversations": [ { "from": "human", "value": "\nIs chalkboard sign at center bigger than black t-shirt at center?" }, { "from": "gpt", "value": "Actually, chalkboard sign at center might be smaller than black t-shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc9abf0c6fe6c268.jpg", "conversations": [ { "from": "human", "value": "\nBetween smooth skin baby at center and dark brown eye at center, which one is positioned higher?" }, { "from": "gpt", "value": "dark brown eye at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/83f220970191ccd3.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, floral fabric hands at center or metallic spoon at lower right, stands shorter?" }, { "from": "gpt", "value": "metallic spoon at lower right is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c5a095e79016cb3a.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.685, 0.338)?" }, { "from": "gpt", "value": "black matte baseball cap at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8daadcc756903b57.jpg", "conversations": [ { "from": "human", "value": "\nBetween matte blue top at center and gold metallic anklet at lower center, which one is positioned lower?" }, { "from": "gpt", "value": "gold metallic anklet at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f218f881f0b4a4f1.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the position of the central figure in the image. You need to retrieve your camera from the leather jacket at right. How far do you have to walk to reach it?" }, { "from": "gpt", "value": "The camera is 52.29 feet away from the leather jacket at right, so you would need to walk approximately 52.29 feet to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/26de15e098f3780a.jpg", "conversations": [ { "from": "human", "value": "\nDoes orange fleece jacket at right come in front of matte gray jacket at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5123ba886aa20c63.jpg", "conversations": [ { "from": "human", "value": "\nIs white fluffy cloud at upper center smaller than black leafy tree at lower left?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fa071ab5487812d2.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.868, 0.613) positioned before point (0.471, 0.988)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03027f9e6d12a593.jpg", "conversations": [ { "from": "human", "value": "\nYou are a swimmer trying to reach the edge of the pool. You see the transparent blue water at lower center and the matte pink float at center. Which object is closer to the pool edge?" }, { "from": "gpt", "value": "The matte pink float at center is closer to the pool edge because the transparent blue water at lower center is positioned on its right side, meaning the float is nearer to the edge." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c724b95bf86e462.jpg", "conversations": [ { "from": "human", "value": "\nYou are driving a car that is 15 feet long. You are currently at point (0.522, 0.652). There is another car parked at the other point. Can your car fit between the two points without crossing the road?" }, { "from": "gpt", "value": "The two points are 298.57 feet apart. Since your car is only 15 feet long, it can easily fit between the two points without crossing the road." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec93503535af1252.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the left, matte brown wicker basket at center or black wood barrel at lower left?" }, { "from": "gpt", "value": "black wood barrel at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aea97c4ba80cd6f6.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the white jersey at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.230, 0.584)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/65927943d299d478.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.388, 0.323)?" }, { "from": "gpt", "value": "woven wood picnic basket at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3e70190b1e164679.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is glossy black puffer jacket at center from denim jeans at lower center?" }, { "from": "gpt", "value": "They are 10.09 inches apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7a2dc66e7bbc579.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between dark blue fabric uniform at center and camera?" }, { "from": "gpt", "value": "dark blue fabric uniform at center and camera are 7.49 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8f613692183d4172.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.652, 0.708) or (0.964, 0.755)?" }, { "from": "gpt", "value": "The point (0.652, 0.708) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0cf1d8bc81be1587.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.264, 0.408) positioned behind point (0.645, 0.570)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6e9cd14383bb468.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, blue fabric jacket at center or translucent plastic bottle at center?" }, { "from": "gpt", "value": "Positioned lower is blue fabric jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0db7e2e2e63f21cf.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, matte red shirt at center or maroon fabric shorts at center?" }, { "from": "gpt", "value": "Positioned to the right is matte red shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c6c7a3c2f414463.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a white uniform at center. Pinpoint a point to the white uniform at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.502, 0.628)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/009994d5c5cb5a2b.jpg", "conversations": [ { "from": "human", "value": "\nIs matte gold bus at center closer to the viewer compared to green grass at center?" }, { "from": "gpt", "value": "No, it is behind green grass at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2a5ee35e9e572d37.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if smooth concrete pavement at lower center is wider than metallic gray pole at right?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01cdb100a59470ed.jpg", "conversations": [ { "from": "human", "value": "\nCould you measure the distance between white matte necklace at center and clear glass water at center?" }, { "from": "gpt", "value": "white matte necklace at center and clear glass water at center are 55.23 centimeters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c30de7c4fab2a298.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white sweater at center is smaller than black plastic microphone at center?" }, { "from": "gpt", "value": "Actually, white sweater at center might be larger than black plastic microphone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4058828a5534dbca.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any green grassy at lower center in the image." }, { "from": "gpt", "value": "[(0.486, 0.848)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/af1795bdb25835ca.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the edge of the waterway and see the brown woven basket at left. How far away is it from you?" }, { "from": "gpt", "value": "The brown woven basket at left is 15.73 meters away from you." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d13f5b609b482483.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.039, 0.258) from camera?" }, { "from": "gpt", "value": "Point (0.039, 0.258) and camera are 68.76 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e35adb79c7112dc1.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of green grass at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.483, 0.830)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/65872de5a0eebfb6.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the living room and want to turn off the orange matte lampshade at upper center. If you are 1.5 meters tall and can reach up to 2 meters from the ground, can you reach it?" }, { "from": "gpt", "value": "The orange matte lampshade at upper center is 1.67 meters away from camera. Since you can reach up to 2 meters, you can reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9995f7374409f0e5.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of light gray cotton shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.787, 0.748)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d90a84fdfe4085f9.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of white cotton shirt at center more distant than that of matte white shirt at center?" }, { "from": "gpt", "value": "No, it is in front of matte white shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1a11680362e816e.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.493, 0.545) from camera?" }, { "from": "gpt", "value": "41.26 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a192b153bd2f071.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the green leafy hedge at lower left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.084, 0.880)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1704e9814815a5eb.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and want to step onto the yellow concrete pavement at center. How far do you need to walk to reach it?" }, { "from": "gpt", "value": "The yellow concrete pavement at center is 3.86 meters away from the camera, so you need to walk 3.86 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc769607950ae70a.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of point (0.467, 0.791)?" }, { "from": "gpt", "value": "89.48 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c195091410e4d9c.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the dark brown leather jacket at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.197, 0.561)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08e88c77d53a2b20.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.201, 0.339) and point (0.735, 0.662), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.201, 0.339) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/54ed5cddd935bed4.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a shiny silver sedan at right. Pinpoint a point to the shiny silver sedan at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.954, 0.211)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c7ad2b378aae05c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white paper airplane at center is shorter than white paper at lower left?" }, { "from": "gpt", "value": "Incorrect, white paper airplane at center's height does not fall short of white paper at lower left's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/006e4e3f92746226.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, transparent skin hand at center or clear plastic bottle at center?" }, { "from": "gpt", "value": "transparent skin hand at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d9d71f0312044ed.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of dark gray textured sweater at upper right? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.777, 0.287)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36fae0d11df5e5bd.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.850, 0.430) positioned after point (0.463, 0.416)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce9881b36714c4fd.jpg", "conversations": [ { "from": "human", "value": "\nYou are a pet owner who wants to ensure your rabbits have easy access to their water bowl. Based on the scene, can the brown fur rabbit at center reach the white glossy bowl at lower right without moving from its current position?" }, { "from": "gpt", "value": "The brown fur rabbit at center is above the white glossy bowl at lower right, so it can easily reach the bowl without needing to move from its current position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ecb79154156e663.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.212, 0.416) or (0.835, 0.477)?" }, { "from": "gpt", "value": "Point (0.835, 0.477)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/41e6db8834bbc04f.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of green textured bush at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.037, 0.608)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab2799a19162e648.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth gray cat at center below black glossy monitor at upper left?" }, { "from": "gpt", "value": "Correct, smooth gray cat at center is located below black glossy monitor at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e289e4bf24433e11.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from bare branches at upper right to gold metallic dome at upper center." }, { "from": "gpt", "value": "bare branches at upper right and gold metallic dome at upper center are 36.49 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fdba588c63d63f70.jpg", "conversations": [ { "from": "human", "value": "\nDoes white glossy swan at right have a lesser width compared to white matte swan at center?" }, { "from": "gpt", "value": "No, white glossy swan at right is not thinner than white matte swan at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7935ef61f8dacffa.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.826, 0.973) or (0.306, 0.431)?" }, { "from": "gpt", "value": "Point (0.826, 0.973) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/da4214f6961ef822.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of checkered fabric shirt at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.179, 0.695)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/397b06f29d2cdb8e.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of orange matte tangerine at center from orangesmoothorange segment at center?" }, { "from": "gpt", "value": "8.70 inches" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8fd007d630a5f697.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the dark gray sweater at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.270, 0.753)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/978691ebd6c9be8c.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the scene of a person interacting with a car. Given that the dark striped sweater at center and the metallic gold car at upper center are both in the frame, which object should you focus on to ensure the larger subject is properly highlighted?" }, { "from": "gpt", "value": "The metallic gold car at upper center should be focused on because it occupies more space than the dark striped sweater at center, making it the larger subject in the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e21f386681fc6807.jpg", "conversations": [ { "from": "human", "value": "\nYou are a parade attendee who wants to hand a flower to the person in the metallic gold helmet at center from your current position near the gold metallic wheelchair at center. Is the distance between them within your comfortable throwing range?" }, { "from": "gpt", "value": "The distance between the metallic gold helmet at center and the gold metallic wheelchair at center is 6.04 meters. A comfortable throwing range for a flower is typically around 5 meters, so you may struggle to accurately throw the flower that far. It might be better to walk closer or ask someone else to pass it along." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fab4bf68152aabac.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, green grass at center or blue striped polo shirt at center?" }, { "from": "gpt", "value": "green grass at center is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d28ff6c105dc8f03.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.814, 0.798) or (0.204, 0.289)?" }, { "from": "gpt", "value": "Point (0.204, 0.289)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c9681bc8e7697452.jpg", "conversations": [ { "from": "human", "value": "\nYou are designing a garden layout and need to place a new flower bed along the brick paved walkway at center. Considering the smooth red bench at right is already there, can you determine if the walkway is wide enough to accommodate a 2 meter wide flower bed on its left side?" }, { "from": "gpt", "value": "The brick paved walkway at center is wider than the smooth red bench at right. Since the bench is on the right side, the walkway has enough space on its left side to accommodate a 2 meter wide flower bed." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cbcb55f2428a90d1.jpg", "conversations": [ { "from": "human", "value": "\nLocate all brown and white fur cat at left in the image." }, { "from": "gpt", "value": "[(0.282, 0.492)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92e87bf2a920e793.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.878, 0.644) or point (0.081, 0.420)?" }, { "from": "gpt", "value": "Point (0.081, 0.420)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/90744bf676f41c4f.jpg", "conversations": [ { "from": "human", "value": "\nIs blue water at center wider than metallic gray ship at center?" }, { "from": "gpt", "value": "Yes, blue water at center is wider than metallic gray ship at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/604e72bd016c70c7.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of point (0.561, 0.533)?" }, { "from": "gpt", "value": "15.96 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/517e433e6fc47b83.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.098, 0.487) or point (0.354, 0.397)?" }, { "from": "gpt", "value": "Point (0.098, 0.487) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8375c3a742f82608.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of white glossy train at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.521, 0.484)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b8d1040d1e91c97.jpg", "conversations": [ { "from": "human", "value": "\nBetween clear plastic billboard at upper center and matte red sedan at center, which one has less height?" }, { "from": "gpt", "value": "With less height is matte red sedan at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/79da5fa339b70d8e.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.697, 0.361) or point (0.053, 0.838)?" }, { "from": "gpt", "value": "Positioned behind is point (0.053, 0.838)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2946fbd3c9e58baa.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance from purple satin suit at center to green wool suit at center." }, { "from": "gpt", "value": "The distance of purple satin suit at center from green wool suit at center is 23.83 inches." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b60d2a7b7f9d8656.jpg", "conversations": [ { "from": "human", "value": "\nYou are a tour guide at the marina and want to direct visitors to the white glossy yacht at center. You see the white glossy boat at right nearby. Which direction should visitors turn to find the yacht?" }, { "from": "gpt", "value": "The white glossy yacht at center is to the left of the white glossy boat at right, so visitors should turn left to find the yacht." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/750c0284a3435290.jpg", "conversations": [ { "from": "human", "value": "\nHow far is neon yellow fabric jacket at center from blue fabric jacket at upper right?" }, { "from": "gpt", "value": "29.45 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ad11c7ae1a7e4292.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte pink dress at left appear over light brown wooden bridge at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/651ac200993343c5.jpg", "conversations": [ { "from": "human", "value": "\nYou are a customer in the convenience store and want to find the soft cover manga at lower right. Based on the store layout, where should you look relative to the refrigerator on the left?" }, { "from": "gpt", "value": "The soft cover manga at lower right is located at the lower right area of the image, which is opposite to the refrigerator on the left. Since the refrigerator is on the left side, you should look towards the right side of the store to find the soft cover manga at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/704d118ce3de33a8.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of white paper at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.262, 0.347)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c53ac43a9619745.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if stone gray tower at center is positioned below stone tower at center?" }, { "from": "gpt", "value": "Actually, stone gray tower at center is above stone tower at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/90e40ac8538ff15b.jpg", "conversations": [ { "from": "human", "value": "\nYou are planning to install a fence between the brown leafless tree at center and the green textured tree at upper center. The fence panels you have are each 10 feet long. How many panels do you need to span the distance between them?" }, { "from": "gpt", "value": "The distance between the brown leafless tree at center and the green textured tree at upper center is 68.88 feet. Each fence panel is 10 feet long, so dividing 68.88 by 10 gives approximately 6.888 panels. Since you can only use whole panels, you would need 7 panels to cover the distance between them." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a58143c1c5a19dd6.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the center of the image and want to walk towards the smooth brown tree trunk at right. Which direction should you face to head directly towards it?" }, { "from": "gpt", "value": "To head directly towards the smooth brown tree trunk at right, you should face towards the right since its 2D location is at point (0.912, 0.536), which is positioned to the right side of the image." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/20757c542a24c5ce.jpg", "conversations": [ { "from": "human", "value": "\nYou are a chef preparing a vegetable arrangement. You have an orange smooth carrot at center and orange matte carrots at center in front of you. Which carrot should you choose if you want the one that is closer to you?" }, { "from": "gpt", "value": "The orange smooth carrot at center is closer because it is in front of the orange matte carrots at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc21834c2f71b4a4.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.392, 0.716) or point (0.815, 0.592)?" }, { "from": "gpt", "value": "Point (0.392, 0.716) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00af217a66b8d5c0.jpg", "conversations": [ { "from": "human", "value": "\nWhere is white satin suit at upper right located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.721, 0.594)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ad28d315191b8d7f.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any curly hair at center in the image." }, { "from": "gpt", "value": "[(0.175, 0.752)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03ae732008c3f60e.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of blonde hair at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.340, 0.338)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ad75bce65989c5d8.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, brushed metal tractor at left or white lace dress at center?" }, { "from": "gpt", "value": "white lace dress at center is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1bf973ecb66be9e1.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.686, 0.441) farther from camera compared to point (0.469, 0.595)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aa518d21643b784e.jpg", "conversations": [ { "from": "human", "value": "\nIs black glossy dress at center taller than light brown wooden guitar at center?" }, { "from": "gpt", "value": "Yes, black glossy dress at center is taller than light brown wooden guitar at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fd6f6bb6feb6e559.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.595, 0.952) more distant than point (0.354, 0.436)?" }, { "from": "gpt", "value": "No, it is in front of (0.354, 0.436)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82f5d908456bac04.jpg", "conversations": [ { "from": "human", "value": "\nYou are a firefighter in the scene and need to locate the point at coordinates (0.153, 0.367). According to the scene description, where exactly would this point be located?" }, { "from": "gpt", "value": "The point at coordinates (0.153, 0.367) is on the matte red helmet at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b61c02ef4a066731.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the edge of the water and see the point marked at coordinates (0.769, 0.339). Which object in the scene is that point located on?" }, { "from": "gpt", "value": "The point marked at coordinates (0.769, 0.339) is located on the weathered wood hut at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/69fa5b989e25fbb2.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.549, 0.731) and point (0.531, 0.372), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.531, 0.372) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1041d3a30b21f37.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.389, 0.794) or (0.022, 0.048)?" }, { "from": "gpt", "value": "Positioned behind is point (0.022, 0.048)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9c7ee3c4156a1b7.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the garden and want to find the beige corduroy pants at right. Based on the coordinates provided, in which direction should you look relative to the other people on the bench?" }, { "from": "gpt", "value": "The beige corduroy pants at right is located at point 0.553 on the x and 0.858 on the y, which places it towards the right side of the image. Since the individuals are seated on a bench from left to right, you should look to the rightmost part of the bench to find the beige corduroy pants at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5f736ebefc4b0a7f.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the smooth brown bowl at lower left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.151, 0.700)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3113c7a2a8c33361.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.339, 0.373) come in front of point (0.632, 0.945)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf50bcff6b8bab44.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte red jacket at center have a lesser height compared to camouflage fabric helmet at upper center?" }, { "from": "gpt", "value": "Indeed, matte red jacket at center has a lesser height compared to camouflage fabric helmet at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c6680415a59d87fc.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer taking a picture of the scene. You notice the denim shorts at center and the brown leather boot at center in your frame. Which object is positioned higher in the image?" }, { "from": "gpt", "value": "The denim shorts at center is above the brown leather boot at center in the image." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b94da229e2db2494.jpg", "conversations": [ { "from": "human", "value": "\nYou are looking at the bowl of apples and want to place a sticker on both point (0.704, 0.619) and point (0.438, 0.581). Which point is closer to you?" }, { "from": "gpt", "value": "Point (0.438, 0.581) is closer to you because it is less further than point (0.704, 0.619)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6adc0d77a9be13a0.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if striped cotton shirt at center is wider than white fleece jacket at lower left?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c5b1aac0ba3dcdec.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.739, 0.383) or (0.101, 0.342)?" }, { "from": "gpt", "value": "Positioned in front is point (0.101, 0.342)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/754da5d53a230036.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.079, 0.466) more distant than point (0.475, 0.308)?" }, { "from": "gpt", "value": "Yes, point (0.079, 0.466) is behind point (0.475, 0.308)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/27753a26d20ed565.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.580, 0.811) and point (0.143, 0.894), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.580, 0.811)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9b33c09d7c65542.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.916, 0.931) or point (0.409, 0.492)?" }, { "from": "gpt", "value": "The point (0.409, 0.492) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2629f30e54b56f6e.jpg", "conversations": [ { "from": "human", "value": "\nDoes shiny red hair at center have a larger size compared to shiny green necklace at lower right?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b6be31e22ae89cbe.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the matte brown shotgun at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.182, 0.655)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4d463b7e7232fe8c.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of matte red hatchback at lower left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.134, 0.925)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c92fdbe2ce32a637.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the wooden fence at lower center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.510, 0.908)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a21cf7a62301d362.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.176, 0.103) or point (0.507, 0.720)?" }, { "from": "gpt", "value": "Positioned behind is point (0.507, 0.720)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e5a910f5e9cbebe0.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.027, 0.914) or point (0.249, 0.870)?" }, { "from": "gpt", "value": "Point (0.027, 0.914) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c9c8f17f01103c7.jpg", "conversations": [ { "from": "human", "value": "\nIs denim shorts at left taller than green plaid shirt at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eeb1f63e944880d1.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.723, 0.422) closer to viewer compared to point (0.475, 0.681)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/643b986941b77cdc.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.427, 0.542) and camera?" }, { "from": "gpt", "value": "Point (0.427, 0.542) is 8.37 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a51cc5ddeab2beaf.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the edge of the water in the sunset scene. There are two points marked in the image. Which point, point (0.056, 0.908) or point (0.349, 0.512), is closer to you?" }, { "from": "gpt", "value": "Point (0.056, 0.908) is closer to the viewer than point (0.349, 0.512)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/405e07a5d78a5793.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the back of the classroom. You want to take a photo that includes both the white cotton shirt at center and the white matte shirt at upper right. Given that your camera has a maximum focus range of 5 meters, will you be able to capture both shirts in focus?" }, { "from": "gpt", "value": "The distance between the white cotton shirt at center and the white matte shirt at upper right is 4.75 meters, which is within the camera maximum focus range of 5 meters. Therefore, you can capture both shirts in focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ee05c03bfe235bd2.jpg", "conversations": [ { "from": "human", "value": "\nYou are a station attendant and need to determine if the red glossy train at center can pass through a narrow corridor that is only as wide as the translucent glass globe at center. Based on their widths, can the train safely pass through the corridor?" }, { "from": "gpt", "value": "The red glossy train at center is wider than the translucent glass globe at center, so it cannot safely pass through the corridor which is only as wide as the globe." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/393d88d7b3d2e77d.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the right, wooden table at center or crumbly brown topping at center?" }, { "from": "gpt", "value": "From the viewer's perspective, crumbly brown topping at center appears more on the right side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c854f83b32ee5493.jpg", "conversations": [ { "from": "human", "value": "\nLocate the red cotton shirt at right in the image." }, { "from": "gpt", "value": "[(0.902, 0.559)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85ed923e86645b26.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the matte black shirt at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.959, 0.444)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/822113f22095f830.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the white fabric tent at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.273, 0.828)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e25e922014fb80ef.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from green fabric bag at lower left to camera." }, { "from": "gpt", "value": "green fabric bag at lower left and camera are 55.56 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/75b0f7a4d5fc7697.jpg", "conversations": [ { "from": "human", "value": "\nIs hardcover books at center to the left of white matte littlefreelibrary sign at left from the viewer's perspective?" }, { "from": "gpt", "value": "In fact, hardcover books at center is to the right of white matte littlefreelibrary sign at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3ede112fea449530.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black matte laptop at left is wider than silver metallic laptop at center?" }, { "from": "gpt", "value": "Correct, the width of black matte laptop at left exceeds that of silver metallic laptop at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0b2c52012210baf.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the white cotton t-shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.308, 0.662)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ccc95f47b8675384.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture both the matte black suit at center and the matte black suit at left in a single frame. Since the camera has a fixed focus, you need to ensure both subjects are in the same focal plane. Given their sizes, which one should you focus on to maximize clarity for both?" }, { "from": "gpt", "value": "You should focus on the matte black suit at center because it is larger and will require more precise focus to maintain clarity, ensuring the smaller matte black suit at left also stays sharp." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5fd847a068cf2b0.jpg", "conversations": [ { "from": "human", "value": "\nHow close is brown stone church at center from green leafy tree at upper left?" }, { "from": "gpt", "value": "brown stone church at center is 12.54 meters away from green leafy tree at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/47bade4479eeeb82.jpg", "conversations": [ { "from": "human", "value": "\nLocate navy satin gown at lower left in the image." }, { "from": "gpt", "value": "[(0.083, 0.811)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a3dbee2a5a56fa99.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker standing at the base of the dark brown spiky palm tree at center. You want to reach the silvery gray mountain at center. How far do you need to travel in feet?" }, { "from": "gpt", "value": "The silvery gray mountain at center is 125.99 feet from the dark brown spiky palm tree at center, so you need to travel 125.99 feet to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6819dadf6d8e90ad.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a matte black suit at center. Pinpoint a point to the matte black suit at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.245, 0.613)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d545bd1ddf9d97d.jpg", "conversations": [ { "from": "human", "value": "\nYou are a passenger in the safari vehicle parked on the dirt path. You notice two points marked on the ground ahead of you. The first point is at coordinates point (0.196, 0.438) and the second is at point (0.980, 0.972). From your perspective in the vehicle, which point is closer to you?" }, { "from": "gpt", "value": "Point (0.980, 0.972) is closer to you because the description states that point (0.196, 0.438) is behind point (0.980, 0.972), meaning the latter is nearer to your current position in the vehicle." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/669b140761a93519.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.308, 0.931) in front of point (0.420, 0.909)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e4421262442e9ec.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.002, 0.942) from camera?" }, { "from": "gpt", "value": "Point (0.002, 0.942) and camera are 1.04 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a15976869e1531c3.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.254, 0.878) come behind point (0.826, 0.602)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bb16396f405ee06e.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of black matte jacket at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.733, 0.641)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fcc67fad71c60d41.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of wooden skateboard at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.591, 0.298)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd867ff9911090f6.jpg", "conversations": [ { "from": "human", "value": "\nBetween gray fleece vest at center and blue metallic can at center right, which one is positioned higher?" }, { "from": "gpt", "value": "gray fleece vest at center is above." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/84c057cb87db15e7.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green leafy tree at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.278, 0.202)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/28b3bf2b738c8a11.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of white plastic license plate at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.175, 0.723)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0265bcbac397301.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.032, 0.338) behind point (0.757, 0.761)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b18be157cff53dd8.jpg", "conversations": [ { "from": "human", "value": "\nCould you provide the distance between brown metal train track at center and matte red locomotive at center?" }, { "from": "gpt", "value": "brown metal train track at center and matte red locomotive at center are 29.84 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e3ffb51704327b3a.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between green leafy tree at right and green grassy field at center." }, { "from": "gpt", "value": "green leafy tree at right and green grassy field at center are 12.77 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ae8ddd293c688c80.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark suit at center have a lesser width compared to matte beige shirt at center?" }, { "from": "gpt", "value": "Indeed, dark suit at center has a lesser width compared to matte beige shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc12ef9c929e8f88.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte beige dress at left have a larger size compared to polka dot fabric dress at center?" }, { "from": "gpt", "value": "Correct, matte beige dress at left is larger in size than polka dot fabric dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d14de09252979d1.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass at center wider than rusty wood hut at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe4f1be179a6465b.jpg", "conversations": [ { "from": "human", "value": "\nDoes light brown wood flooring at center have a greater height compared to clear glass sliding doors at left?" }, { "from": "gpt", "value": "No, light brown wood flooring at center is not taller than clear glass sliding doors at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2fee84fe8e5ecdb1.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.301, 0.695) or point (0.180, 0.717)?" }, { "from": "gpt", "value": "Positioned behind is point (0.180, 0.717)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/96fc6e7ee572452a.jpg", "conversations": [ { "from": "human", "value": "\nLocate all orange checkered shirt at left in the image." }, { "from": "gpt", "value": "[(0.245, 0.600)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8fa4956703b330da.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white satin shirt at left is positioned above black plastic goggles at left?" }, { "from": "gpt", "value": "No, white satin shirt at left is not above black plastic goggles at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6a6bb49749b99a98.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.728, 0.637) closer to camera compared to point (0.263, 0.477)?" }, { "from": "gpt", "value": "Yes, point (0.728, 0.637) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/573bfed57197b098.jpg", "conversations": [ { "from": "human", "value": "\nYou are a spectator at the game and want to find the point marked at coordinates (0.562, 0.764). Where should you look in the arena?" }, { "from": "gpt", "value": "The point marked at coordinates (0.562, 0.764) is located on the wooden basketball court at center. So you should look at the center of the court where the San Antonio Spurs logo is displayed." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0018c38c024185ba.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the green matte tree at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.775, 0.944)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37c18893450b1686.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.086, 0.845) or point (0.610, 0.959)?" }, { "from": "gpt", "value": "Point (0.086, 0.845) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7caf22ceac17fa7.jpg", "conversations": [ { "from": "human", "value": "\nCould you measure the distance between clear water at bridge center and light brown leather jacket at upper left?" }, { "from": "gpt", "value": "A distance of 25.98 meters exists between clear water at bridge center and light brown leather jacket at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0152d93cbd14457d.jpg", "conversations": [ { "from": "human", "value": "\nIs fuzzy black and white ostrich at center taller than fuzzy black ostrich at center?" }, { "from": "gpt", "value": "Yes, fuzzy black and white ostrich at center is taller than fuzzy black ostrich at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd398569a1bcc3f2.jpg", "conversations": [ { "from": "human", "value": "\nBetween matte khaki suit at center and green cotton shirt at center, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "green cotton shirt at center is more to the right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29e656b086efc9f2.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.561, 0.644) closer to camera compared to point (0.157, 0.508)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b397ab6e8f2f9990.jpg", "conversations": [ { "from": "human", "value": "\nHow close is smooth stone houses at upper center from camera?" }, { "from": "gpt", "value": "smooth stone houses at upper center and camera are 267.00 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85ed923e86645b26.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the center of the beach and want to place a new bench. The bench must be placed such that it is exactly halfway between the white fabric bag at center and the ocean. Where should you place the bench?" }, { "from": "gpt", "value": "The bench should be placed halfway between the white fabric bag at center and the ocean. Since the white fabric bag at center is located at point (0.837, 0.770), the bench should be placed along the line connecting it to the ocean, exactly halfway between those two points." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a34172e4219c043.jpg", "conversations": [ { "from": "human", "value": "\nIs white cotton shirt at left positioned before striped fabric at center?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb4a2d0be265fb76.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance from green leafy tree at center to green leafy tree at upper left." }, { "from": "gpt", "value": "22.32 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d8cf1a7f26850cb9.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.936, 0.597) come in front of point (0.368, 0.730)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77e253ac902c001e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.846, 0.566)?" }, { "from": "gpt", "value": "rusty metal garbage truck at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c7bcc8f8046b82c.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of blue water at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.243, 0.909)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3e4807b4e0954bdb.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of autumn leaves at upper center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.448, 0.153)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/55aaae12c90628ab.jpg", "conversations": [ { "from": "human", "value": "\nYou are at a party and see two people in the image. The black hair at right and the white cotton shirt at left are part of the scene. Which object is positioned to the right of the other?" }, { "from": "gpt", "value": "The black hair at right is to the right of the white cotton shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/446fd87c793ff5ec.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.573, 0.122)?" }, { "from": "gpt", "value": "metallic gray roof at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d7714babddeaf7ed.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black matte shirt at left is bigger than black textured sweater at right?" }, { "from": "gpt", "value": "Actually, black matte shirt at left might be smaller than black textured sweater at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04ac5ca55ac606ef.jpg", "conversations": [ { "from": "human", "value": "\nYou have a cat toy that is 10 inches long. You want to place it on the fuzzy charcoal cat bed at center where the black fur cat at center is resting. Can the cat toy fit on the bed without overlapping the cat?" }, { "from": "gpt", "value": "The fuzzy charcoal cat bed at center might be wider than black fur cat at center, so there is a possibility that the cat toy can fit on the bed without overlapping the cat. However, the exact dimensions are uncertain based on the provided information." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9626b8bdd06ad19f.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of purple matte apple at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.386, 0.291)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4709f897f1f6c26.jpg", "conversations": [ { "from": "human", "value": "\nYou are planning to take a photo of the metallic gray stairs at center and the matte black backpack at center at the Eiffel Tower. Which object should you focus on first if you want to capture both in a single frame without moving the camera?" }, { "from": "gpt", "value": "You should focus on the metallic gray stairs at center first because it is shorter than the matte black backpack at center, allowing you to position it lower in the frame while still including the taller backpack." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9daa995336ba8c32.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, black marble vanity at lower center or gold ornate mirror at center, stands shorter?" }, { "from": "gpt", "value": "black marble vanity at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fdb97b12b544d370.jpg", "conversations": [ { "from": "human", "value": "\nYou are trying to place the velvet brown jacket at center on the brown fabric table at center. Based on their sizes, will the jacket fit entirely on the table?" }, { "from": "gpt", "value": "The brown fabric table at center has a larger width than the velvet brown jacket at center, so the jacket will fit entirely on the table." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/160433473bfd3e2e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.583, 0.527)?" }, { "from": "gpt", "value": "yellow matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ae4183d41991bd28.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the room and want to walk towards the black matte shirt at center. What direction should you move in relative to the door on the left side of the frame?" }, { "from": "gpt", "value": "The black matte shirt at center is positioned at point (0.701, 0.503), so you should move towards the center of the room away from the door on the left side of the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ba7b9a9b55f513a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if yellow matte jacket at center is positioned below blue fleece jacket at right?" }, { "from": "gpt", "value": "Correct, yellow matte jacket at center is located below blue fleece jacket at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5df0cecf90b08290.jpg", "conversations": [ { "from": "human", "value": "\nYou are a parent trying to decide where to place a new toy box in the backyard. The toy box is the same size as the white cotton hat at upper right. Based on the image, can the toy box fit on the white plastic table at center without overlapping the bowls and cup?" }, { "from": "gpt", "value": "The white plastic table at center has a larger size compared to white cotton hat at upper right, so the toy box can fit on the white plastic table at center as long as there is enough space not occupied by the bowls and cup." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bb49bb80809700ba.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person trying to avoid puddles while walking down the street. You see the smooth concrete pavement at center and the wet asphalt at center. Which surface should you walk on to stay dry?" }, { "from": "gpt", "value": "The smooth concrete pavement at center is positioned on the right side of wet asphalt at center. Since the asphalt is wet, you should walk on the smooth concrete pavement at center to avoid getting wet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/98b3bacbd90c8c0e.jpg", "conversations": [ { "from": "human", "value": "\nDoes light beige fabric dress at left have a lesser width compared to black floral dress at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a160c0a6cf34036f.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the left, matte black coat at center or matte black jacket at lower left?" }, { "from": "gpt", "value": "Positioned to the left is matte black jacket at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/54737e48e308eca9.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point labeled as point (0.713, 0.750) in the image. What is the nearest object to you?" }, { "from": "gpt", "value": "The point (0.713, 0.750) is on green leafy bush at center, so the nearest object to you is the green leafy bush at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3fc52af6c1953fa8.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between matte plastic doll at center and camera?" }, { "from": "gpt", "value": "matte plastic doll at center is 34.23 inches from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d6b5afec376570a.jpg", "conversations": [ { "from": "human", "value": "\nYou are a gardener who needs to trim the green leafy hedge at upper center and the bronze textured manhole cover at center. Which object requires a ladder to reach its top?" }, { "from": "gpt", "value": "The green leafy hedge at upper center requires a ladder to reach its top because it is taller than the bronze textured manhole cover at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de670c72183d5c25.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, gold textured dress at center or light brown textured dress at center?" }, { "from": "gpt", "value": "light brown textured dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec3c253c2492b320.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the transparent teal car at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.790, 0.866)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/39aa0f24a4036db5.jpg", "conversations": [ { "from": "human", "value": "\nDoes whitematerial/textureflag at center have a smaller size compared to white cotton shirt at upper center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/99ab6b00d5e16fb2.jpg", "conversations": [ { "from": "human", "value": "\nDoes floral fabric hat at center appear under smooth brown suit at center?" }, { "from": "gpt", "value": "Correct, floral fabric hat at center is located below smooth brown suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd8724aa1cbd6346.jpg", "conversations": [ { "from": "human", "value": "\nIs blue t-shirt at lower left positioned at the back of blue fabric person at lower left?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd922f5bae6a6f6e.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray rough rock at center right have a greater height compared to clear water at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/606d973a2afef747.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in a pasture and see the speckled white cow at center and the brown leather bull at right. Which direction should you walk to get closer to both animals while staying between them?" }, { "from": "gpt", "value": "Walk towards the left side of the brown leather bull at right, as the speckled white cow at center is to the left of the brown leather bull at right, so staying between them would require positioning yourself to the left of the bull." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/53caea978a0a6dc8.jpg", "conversations": [ { "from": "human", "value": "\nHow close is green leafy tree at upper right from orange metallic tow truck at center?" }, { "from": "gpt", "value": "They are 7.36 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/339505345a663b62.jpg", "conversations": [ { "from": "human", "value": "\nLocate all black matte suv at right in the image." }, { "from": "gpt", "value": "[(0.790, 0.708)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/90c9d12b95d8df56.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.208, 0.303) closer to camera compared to point (0.226, 0.498)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/90e7de9f04a0fb6a.jpg", "conversations": [ { "from": "human", "value": "\nLocate the black matte cap at upper center in the image." }, { "from": "gpt", "value": "[(0.811, 0.823)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/21c5f0ada945ff6f.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark gray sweater at center is positioned below plaid shirt at left?" }, { "from": "gpt", "value": "Incorrect, dark gray sweater at center is not positioned below plaid shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f070828ff13b8e54.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from point (0.123, 0.688) to camera." }, { "from": "gpt", "value": "They are 13.05 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4ea3d66f59ee2d6f.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte shirt at center have a lesser width compared to brown textured shirt at right?" }, { "from": "gpt", "value": "Indeed, white matte shirt at center has a lesser width compared to brown textured shirt at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/26ad42f2e73a17f1.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.768, 0.700) lie behind point (0.818, 0.648)?" }, { "from": "gpt", "value": "No, (0.768, 0.700) is in front of (0.818, 0.648)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/21105175a08dc459.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, green leafy tree at center or brown dirt track at center, stands shorter?" }, { "from": "gpt", "value": "Standing shorter between the two is green leafy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/758120a4e2e86bc2.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the white glossy counter top at lower center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.538, 0.947)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5158200d5157eba.jpg", "conversations": [ { "from": "human", "value": "\nYou are a drone operator trying to capture a photo of the construction site. The camera is currently positioned to focus on the brown bark trees at upper left. To ensure the entire scene is visible, should you pan the camera to the left or right?" }, { "from": "gpt", "value": "The brown bark trees at upper left are located at point (0.192, 0.216), so panning the camera to the right would help capture more of the construction site in the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4b10d7a57b3e0453.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the dark matte helicopter at upper center and the white glossy boat at upper left in a single shot. Given that your camera has a limited field of view, which object should you prioritize framing first to ensure both are in the shot?" }, { "from": "gpt", "value": "The dark matte helicopter at upper center is larger in width than the white glossy boat at upper left, so you should prioritize framing the dark matte helicopter at upper center first to ensure both fit within the camera frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ac25addb8cf02574.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.160, 0.848) or (0.131, 0.984)?" }, { "from": "gpt", "value": "Point (0.160, 0.848) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/47f2270bfd27d2ca.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the middle of the salt pans and looking up. Which direction should you face to see the cloudy sky at upper center?" }, { "from": "gpt", "value": "The cloudy sky at upper center is located at coordinates approximately 0.678 along the x axis and 0.578 along the y axis, so you should look upwards and slightly to the right to see it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dbc2fa759f2577e2.jpg", "conversations": [ { "from": "human", "value": "\nWhere is black plastic wheelchair at lower left located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.173, 0.908)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/14cab664a1e7c295.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the green grass at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.259, 0.886)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/19c8482f1dbe0ed0.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.702, 0.633) and point (0.749, 0.225), which one is positioned behind?" }, { "from": "gpt", "value": "Positioned behind is point (0.749, 0.225)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e7f1eafc5a7b9d2a.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of matte white robe at left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.080, 0.528)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0331c160631af3d1.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the rural field and see the green grass at lower center and the gray fabric pants at left. Which object is positioned to the right of the other?" }, { "from": "gpt", "value": "The green grass at lower center is positioned to the right of the gray fabric pants at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/795e948523df0a5a.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between white smooth pillar at center and camera?" }, { "from": "gpt", "value": "white smooth pillar at center and camera are 5.61 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95d8c91bd72ca92c.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.587, 0.125) come farther from viewer compared to point (0.596, 0.561)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b7de286b6914a33.jpg", "conversations": [ { "from": "human", "value": "\nIs green rough bark tree at center bigger than green leafy tree at center?" }, { "from": "gpt", "value": "Yes, green rough bark tree at center is bigger than green leafy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd1203ee76fd9334.jpg", "conversations": [ { "from": "human", "value": "\nYou are a bartender who needs to reach for the brown matte plastic cup at upper right without touching the skinny white arm at upper center. Can you do this easily?" }, { "from": "gpt", "value": "The skinny white arm at upper center is positioned on the left side of the brown matte plastic cup at upper right, so there is space to the right of the arm to reach the cup without touching it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1df8bd3662331006.jpg", "conversations": [ { "from": "human", "value": "\nDoes suede/velvet high-heeled shoe at center appear under suede/velvet high-heeled shoe at lower left?" }, { "from": "gpt", "value": "Actually, suede/velvet high-heeled shoe at center is above suede/velvet high-heeled shoe at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2987974755a299b9.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of dark blue jeans at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.589, 0.477)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3ef92f5d492841f9.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if silver metallic flute at center is thinner than silver/metallic flute at center?" }, { "from": "gpt", "value": "Indeed, silver metallic flute at center has a lesser width compared to silver/metallic flute at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/39c82e09b856cb58.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden canoe at right taller than wooden paddle at lower center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ee0ba600519aa812.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of point (0.754, 0.552)?" }, { "from": "gpt", "value": "Point (0.754, 0.552) is 5.41 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b5f6e5fad97a2d6.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green leafy hedge at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.188, 0.747)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e7b00feab038db1.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.853, 0.339) behind point (0.593, 0.280)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a2361f77ea4fd66.jpg", "conversations": [ { "from": "human", "value": "\nIs teal matte bench at lower left below white glossy corridor at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d37f90c2ded938ef.jpg", "conversations": [ { "from": "human", "value": "\nIs rough bark tree trunk at center wider than green matte grapes at right?" }, { "from": "gpt", "value": "Indeed, rough bark tree trunk at center has a greater width compared to green matte grapes at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e83c6565eacd3ba.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the striped fabric shirt at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.171, 0.591)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/87300be2b273f34c.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to white paper at upper center? Please provide its 2D coordinates.Where can I find white paper at upper center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.354, 0.216)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/83ff21a9003baa1e.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of green matte christmas tree at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.483, 0.159)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ff367285515dc36.jpg", "conversations": [ { "from": "human", "value": "\nIs black satin dress at center smaller than white fabric flower at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/658c0beae45c7433.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.049, 0.450) and camera." }, { "from": "gpt", "value": "Point (0.049, 0.450) is 2.24 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/54c77d2dd7d59c2b.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.472, 0.547) or point (0.822, 0.289)?" }, { "from": "gpt", "value": "Point (0.822, 0.289)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c9dd450c158de945.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the blue printed scarf at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.788, 0.806)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fd1a517dafe03d04.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the bridge and want to place a small boat in the scene. The boat requires a space wider than the green leafy tree at center to float. Can the clear water at center accommodate the boat?" }, { "from": "gpt", "value": "The clear water at center has a width larger than the green leafy tree at center, so yes, the boat can float there as it provides sufficient space." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd379e942f3c7d01.jpg", "conversations": [ { "from": "human", "value": "\nLocate black suit at right in the image." }, { "from": "gpt", "value": "[(0.944, 0.562)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd56fe2cbc746f36.jpg", "conversations": [ { "from": "human", "value": "\nYou are an interior designer planning to install a new wall art piece between the stained glass window at upper center and the matte glass lamp at upper left. Given their widths, which object should you consider for placement adjustments to ensure the art fits properly?" }, { "from": "gpt", "value": "The stained glass window at upper center is wider than the matte glass lamp at upper left. To ensure proper placement, adjust the position of the stained glass window at upper center to accommodate the wall art piece." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c13de88a4946e75b.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing a photo shoot and need to determine the best position for a spotlight. The spotlight needs to be placed where the floral skirt at center and the matte black dress at center are both visible. Based on their widths, which object should be closer to the center of the spotlight to ensure both are fully illuminated?" }, { "from": "gpt", "value": "The floral skirt at center is thinner than the matte black dress at center, so the spotlight should be positioned closer to the floral skirt at center to ensure both are fully illuminated." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b0abe6d7edd3d1f.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the green grass at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.510, 0.833)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77f21222c86965b3.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of green rubber hose at right? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.926, 0.559)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2319b88019deae4e.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.941, 0.398) come behind point (0.700, 0.400)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c067ecf6b4f27786.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at a formal event. You need to capture a photo of the black silk suit at left and the gold dotted tie at right. Based on their positions, which object should you focus on first to ensure both are in frame?" }, { "from": "gpt", "value": "The black silk suit at left is above the gold dotted tie at right, so you should focus on the gold dotted tie at right first to ensure both are in frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e5b693d13910df5.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.025, 0.770) from camera?" }, { "from": "gpt", "value": "Point (0.025, 0.770) and camera are 5.00 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c8af19da6a730be.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.620, 0.494)?" }, { "from": "gpt", "value": "stone textured building at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a9c6c8190f1ad308.jpg", "conversations": [ { "from": "human", "value": "\nYou are a tourist standing at the base of the CN Tower and want to take a photo that includes both the concrete tower at center and the gray concrete skyscraper at right. Which object should you position closer to the center of your camera frame to ensure both are fully visible?" }, { "from": "gpt", "value": "You should position the concrete tower at center closer to the center of your camera frame because it is bigger than the gray concrete skyscraper at right, allowing both to fit within the frame when the larger object is centrally placed." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe3591bd9140fd40.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.686, 0.298) come behind point (0.308, 0.903)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9064f9141a90d745.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.298, 0.945) from camera?" }, { "from": "gpt", "value": "75.74 centimeters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a64c5c258f95c71e.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.701, 0.528) or (0.385, 0.716)?" }, { "from": "gpt", "value": "The point (0.385, 0.716) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9de8980a90497aa9.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the crepe stall and want to know how far the point at coordinates point (0.894, 0.889) is from you. What is the distance in feet?" }, { "from": "gpt", "value": "The distance between point (0.894, 0.889) and the viewer is 5.05 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7dd26beba6ecd17.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the rocky shoreline and want to reach the point marked at coordinates (0.542, 0.733). How far is this point from your current position?" }, { "from": "gpt", "value": "The point at (0.542, 0.733) is 7.77 meters away from the viewer, so the distance from your current position at the rocky shoreline to that point is 7.77 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1602177f9654d7d2.jpg", "conversations": [ { "from": "human", "value": "\nYou are an archaeologist examining the stone relief. You need to determine the spatial relationship between the gray stone elephant at center and the gray stone baby elephant at lower center. Which one has a greater width?" }, { "from": "gpt", "value": "The gray stone elephant at center has a greater width than the gray stone baby elephant at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b4b368709476b67.jpg", "conversations": [ { "from": "human", "value": "\nYou are a drone operator planning to fly a drone over the scene. The drone must avoid any obstacles. Given the presence of the metallic wire at upper center, can you determine its exact position to ensure safe navigation?" }, { "from": "gpt", "value": "The metallic wire at upper center is located at coordinates point (0.476, 0.205), so the drone operator should avoid that area to ensure safe navigation." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f223191a71cec76.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is matte gray drawer at lower right from white plastic power strip at upper center?" }, { "from": "gpt", "value": "matte gray drawer at lower right is 85.15 centimeters away from white plastic power strip at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04a0e68661bae419.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte gray suit at left is taller than metallic/matte black microphone at center?" }, { "from": "gpt", "value": "Yes, matte gray suit at left is taller than metallic/matte black microphone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff8269765244d43a.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to matte black suit at center? Please provide its 2D coordinates.Where can I find matte black suit at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.473, 0.594)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3389e367b7b8ef65.jpg", "conversations": [ { "from": "human", "value": "\nBased on the coordinates provided, which object corresponds to the point at (0.171, 0.569)?" }, { "from": "gpt", "value": "The point at (0.171, 0.569) corresponds to the black woolen robe at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/64f39fd7b6c76e4c.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of denim jeans at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.289, 0.791)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aadce0c2fc7ed23c.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from point (0.705, 0.677) to camera." }, { "from": "gpt", "value": "Point (0.705, 0.677) is 1.73 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/84c1185c11dd34c7.jpg", "conversations": [ { "from": "human", "value": "\nIs gray textured blazer at center below striped silk tie at center?" }, { "from": "gpt", "value": "Yes, gray textured blazer at center is below striped silk tie at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4cb60a75abe256c7.jpg", "conversations": [ { "from": "human", "value": "\nIs brown wood reed at center below green leafy tree at upper center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/349847821edb3932.jpg", "conversations": [ { "from": "human", "value": "\nYou are a guest entering the meeting room and see the matte black suit at left and the matte blue shirt at center. Which attendee has a narrower torso? Please answer based on the clothing details." }, { "from": "gpt", "value": "The matte black suit at left has a narrower torso than the matte blue shirt at center because it is thinner." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/57cbc01363ffaeda.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black window at center have a lesser height compared to clear glass window at upper right?" }, { "from": "gpt", "value": "In fact, matte black window at center may be taller than clear glass window at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6250041da459e06a.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue water at center appear on the left side of green leafy tree at center?" }, { "from": "gpt", "value": "Correct, you'll find blue water at center to the left of green leafy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd70e193771bf181.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of point (0.962, 0.989)?" }, { "from": "gpt", "value": "43.08 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b2a8dabeab15d7b0.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.424, 0.755) lie behind point (0.616, 0.531)?" }, { "from": "gpt", "value": "No, it is in front of (0.616, 0.531)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44a40f07ca46a88a.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the white matte cup at table center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.381, 0.661)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f75eea1b21b3c6d.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the green grassy field at lower center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.504, 0.923)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/14d6d6a7b5b9a4c0.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the sailboat scene. You want to ensure that both the blue water at center and the white canvas sail at center are clearly visible in your photo. Given their sizes, which object should you focus on to ensure both are in frame?" }, { "from": "gpt", "value": "The blue water at center is bigger than the white canvas sail at center, so focusing on the larger blue water at center will help ensure both objects are in frame while maintaining their visibility." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1490698d7f698c84.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is gray wool sweater at lower left from brown textured skirt at center?" }, { "from": "gpt", "value": "They are 9.36 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7afb1a1a1c3b93b2.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.000, 0.864) lie in front of point (0.170, 0.344)?" }, { "from": "gpt", "value": "Yes, point (0.000, 0.864) is in front of point (0.170, 0.344)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b462215a897dfdc.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.519, 0.772) farther from viewer compared to point (0.352, 0.964)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0491b54a213e94ad.jpg", "conversations": [ { "from": "human", "value": "\nHow far is blue silk kurta at left from camera?" }, { "from": "gpt", "value": "blue silk kurta at left and camera are 11.04 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/173b466ceed569ec.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, velvet gray blazer at center or white fabric scarf at center?" }, { "from": "gpt", "value": "white fabric scarf at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ddb8c0e17e9d7bfa.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the pink feathered dress at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.338, 0.670)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37219f973a6e07b7.jpg", "conversations": [ { "from": "human", "value": "\nBetween matte gold glasses at upper left and white satin robe at center, which one has less height?" }, { "from": "gpt", "value": "Standing shorter between the two is white satin robe at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/369167fa298a8675.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the rooftop and want to take a photo of the two points. Which point, point (0.358, 0.772) or point (0.264, 0.734), will appear larger in your camera view?" }, { "from": "gpt", "value": "Point (0.358, 0.772) will appear larger in the camera view because it is closer to the camera than point (0.264, 0.734)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b3b6e7f7acdb954e.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of camouflage fabric backpack at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.346, 0.600)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9943a287936f5f24.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between white cotton shirt at center and camera?" }, { "from": "gpt", "value": "white cotton shirt at center is 16.47 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4cb71a140a0a07e.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the smooth asphalt parking lot at lower center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.558, 0.952)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd1f9d58bb21b0c7.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between fuzzy brown dog at center and camera." }, { "from": "gpt", "value": "fuzzy brown dog at center is 26.93 inches away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/91eed019453a81da.jpg", "conversations": [ { "from": "human", "value": "\nIs blue clear water at center smaller than bamboo bench at right?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/17bcea3d4cbb2d17.jpg", "conversations": [ { "from": "human", "value": "\nBetween green metal fence at lower right and blue plastic sign at lower center, which one is positioned lower?" }, { "from": "gpt", "value": "green metal fence at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed3b450a18ac1f88.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.133, 0.370) more distant than point (0.901, 0.273)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/564fcb209ba0cf35.jpg", "conversations": [ { "from": "human", "value": "\nLocate knitted woolen hat at upper left in the image." }, { "from": "gpt", "value": "[(0.236, 0.553)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/14e4564b8ce6acfc.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked as point (0.176, 0.573) in the coastal landscape. A hiker wants to know if they can see the grassy island from your current position. Based on the scene description, can they see the island?" }, { "from": "gpt", "value": "The grassy island is located in the middle ground of the scene, which is visible from the foreground where the point (0.176, 0.573) is situated. Since there are no obstructions mentioned between the point and the island, the hiker can see the grassy island from there." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e1084a72acd8ca98.jpg", "conversations": [ { "from": "human", "value": "\nHow far is point (0.666, 0.573) from the camera?" }, { "from": "gpt", "value": "Point (0.666, 0.573) is 5.00 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b61b73122e886ec.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the golden brown doughnuts at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.369, 0.786)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/da7eecfd9609439b.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.842, 0.844) positioned in front of point (0.558, 0.852)?" }, { "from": "gpt", "value": "No, (0.842, 0.844) is behind (0.558, 0.852)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/447cd19438e050b5.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte trophy at left taller than white shirt at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/57e2a2a6eec71f3a.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of black matte jacket at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.842, 0.691)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73c8f94be93a2bc5.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.702, 0.392) farther from camera compared to point (0.504, 0.077)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/082303ff9a383fc9.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of white fluffy rooster at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.597, 0.495)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/886f4ca34fb8fc99.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.301, 0.945) and point (0.309, 0.498), which one is positioned behind?" }, { "from": "gpt", "value": "Point (0.309, 0.498)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0fcdfabbe3af22e3.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between pink matte swim cap at center and camera?" }, { "from": "gpt", "value": "pink matte swim cap at center and camera are 33.81 inches apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/84ed7e3e110abd5d.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, green algae water at center or brown shiny hair clip at upper right?" }, { "from": "gpt", "value": "From the viewer's perspective, brown shiny hair clip at upper right appears more on the right side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6df1043e5a873969.jpg", "conversations": [ { "from": "human", "value": "\nWhere is dark blue jeans at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.165, 0.266)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9e4391e10f331adf.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the green leafy tree at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.880, 0.228)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0158e8afbaa7d53a.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the room and see the green matte christmas tree at center and the black matte shirt at center. Which object is positioned to the right from your perspective?" }, { "from": "gpt", "value": "The green matte christmas tree at center is to the right of the black matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a097ecc3c749d57.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the edge of the river and notice a point marked at coordinates (0.291, 0.650). What is located at that point?" }, { "from": "gpt", "value": "At point (0.291, 0.650) lies translucent misty water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/010cdf0102b64f7f.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, matte black sunglasses at upper left or black matte goggles at left, stands taller?" }, { "from": "gpt", "value": "Standing taller between the two is matte black sunglasses at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03e9a1db4bc621b2.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.067, 0.769) positioned after point (0.488, 0.677)?" }, { "from": "gpt", "value": "No, (0.067, 0.769) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ad23be7604cd44dc.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the denim jacket at lower left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.212, 0.844)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c14d12b90ac80c6d.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any purple woolen hat at upper center in the image." }, { "from": "gpt", "value": "[(0.780, 0.723)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36472c11cfa15cbe.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.893, 0.998) and point (0.184, 0.795), which one is positioned behind?" }, { "from": "gpt", "value": "Point (0.184, 0.795)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c12915063f19a82f.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, weathered wood picnic table at center or green leafy tree at upper center?" }, { "from": "gpt", "value": "green leafy tree at upper center is more to the right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2abba657867b2cc8.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the bronze statue and its pedestal. You notice two points marked on the pedestal. The first point is at coordinates point (0.628, 0.697) and the second at point (0.213, 0.441). Which point is closer to you?" }, { "from": "gpt", "value": "Point (0.628, 0.697) is closer to the viewer than point (0.213, 0.441)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a92beb0dbd9748d.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of brown rough bark tree at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.678, 0.250)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/504e8b8bfc71a193.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of matte black monitor at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.479, 0.536)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e71ed8ca21c6908.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of the historical fortification and see the point marked at coordinates (0.940, 0.762). What does this point represent in the scene?" }, { "from": "gpt", "value": "The point at coordinates (0.940, 0.762) corresponds to the green grassy embankment at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c1528eb7ef70d53.jpg", "conversations": [ { "from": "human", "value": "\nYou are a technician at the exhibition and need to access both the satin black laptop at center and the white plastic robot at lower left. Which object is closer to you when standing directly in front of the table?" }, { "from": "gpt", "value": "The white plastic robot at lower left is closer because the satin black laptop at center is positioned over it, meaning the laptop is further away from you than the robot." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bec26ce1b7a56ee9.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte bicycle helmet at center bigger than black matte goggles at upper left?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/227bfec262e88d97.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.331, 0.945) and point (0.810, 0.800), which one is positioned behind?" }, { "from": "gpt", "value": "Point (0.810, 0.800)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b9b5d893660bf18.jpg", "conversations": [ { "from": "human", "value": "\nYou are driving a car and see the black asphalt highway at center and the metallic silver van at center through your windshield. Which object is closer to you?" }, { "from": "gpt", "value": "The black asphalt highway at center is closer to you because it is in front of the metallic silver van at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc97e062c605bc5d.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.294, 0.789) and point (0.703, 0.306), which one is positioned in front?" }, { "from": "gpt", "value": "Positioned in front is point (0.294, 0.789)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34c0505b216af89b.jpg", "conversations": [ { "from": "human", "value": "\nIs matte wooden door at center positioned in front of matte wood door at left?" }, { "from": "gpt", "value": "No, it is behind matte wood door at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ceace294c9477a5d.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the matte red t-shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.633, 0.441)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0bcd1ff6ae6b54b9.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the subway car and want to take a photo of both point (0.953, 0.733) and point (0.361, 0.689) in the image. Which point should you focus on first to ensure both are in clear view?" }, { "from": "gpt", "value": "You should focus on point (0.953, 0.733) first because it is closer to the camera than point (0.361, 0.689), ensuring both points are in clear view." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c5c1d50e8355ff50.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer positioned at the bottom of the frame near the purple banner. You need to capture a shot of the gray fleece jacket at center without moving your camera. Can you see the jacket from your current position?" }, { "from": "gpt", "value": "The gray fleece jacket at center is located at point (0.298, 0.614), which is within your field of view from the bottom of the frame near the purple banner. Yes, you can see the jacket without moving your camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e3a63dfb779fb79.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.836, 0.558) or (0.294, 0.503)?" }, { "from": "gpt", "value": "The point (0.836, 0.558) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/610b77b781884f84.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.327, 0.594) or point (0.315, 0.584)?" }, { "from": "gpt", "value": "The point (0.315, 0.584) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a7a517438aebe93.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between fuzzy fur nose at left and brown fur nose at left." }, { "from": "gpt", "value": "fuzzy fur nose at left is 12.83 inches away from brown fur nose at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f96faa6aa37f469.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.051, 0.177) or point (0.906, 0.586)?" }, { "from": "gpt", "value": "Point (0.906, 0.586) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e72faca75c13d251.jpg", "conversations": [ { "from": "human", "value": "\nPoint to denim blue sweater at left.Point to the denim blue sweater at left in the image." }, { "from": "gpt", "value": "[(0.200, 0.666)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a4531d0d3c76a86.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.556, 0.784) and point (0.305, 0.905), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.305, 0.905) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c404fee5b3dfcc4e.jpg", "conversations": [ { "from": "human", "value": "\nDoes green fuzzy hat at upper left have a greater width compared to matte green face at center?" }, { "from": "gpt", "value": "Yes, green fuzzy hat at upper left is wider than matte green face at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e49c46249ac67e48.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.523, 0.406) and point (0.879, 0.552), which one is positioned in front?" }, { "from": "gpt", "value": "Positioned in front is point (0.523, 0.406)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05c13568c91722ea.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue rubber toothbrush at center is positioned to the right of red plastic toothbrush at upper right?" }, { "from": "gpt", "value": "Incorrect, blue rubber toothbrush at center is not on the right side of red plastic toothbrush at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c8e31cf4bf29fb40.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between point (0.490, 0.725) and camera?" }, { "from": "gpt", "value": "Point (0.490, 0.725) is 11.52 feet away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f14bddce71bb5e84.jpg", "conversations": [ { "from": "human", "value": "\nIs weathered wood fence at lower center thinner than green grass at center?" }, { "from": "gpt", "value": "In fact, weathered wood fence at lower center might be wider than green grass at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ecf52820d79d06cc.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of black glossy smartphone at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.338, 0.711)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/069497fbb1122492.jpg", "conversations": [ { "from": "human", "value": "\nWhere is black cotton shirt at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.473, 0.597)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bcc66dd59c0e3bf7.jpg", "conversations": [ { "from": "human", "value": "\nDescribe the object at (0.423, 0.877)." }, { "from": "gpt", "value": "wooden table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/792078f8b31306f2.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.566, 0.366) or point (0.264, 0.816)?" }, { "from": "gpt", "value": "Point (0.566, 0.366)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/975771b0e18db427.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker who wants to find the tallest tree in the area. You see a green leafy tree at left and a green leafy tree at center. Which one should you approach to find the taller one?" }, { "from": "gpt", "value": "The green leafy tree at left is taller than the green leafy tree at center, so you should approach the green leafy tree at left to find the taller one." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a28fb9724bf674d.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing a parade and need to ensure that the smooth red flag at center can fit into a display case designed for the brown leather jacket at lower right. Given their sizes, will the flag fit inside the case?" }, { "from": "gpt", "value": "The smooth red flag at center is wider than the brown leather jacket at lower right, so it will not fit into the display case designed for the jacket." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95147eb07d3da78f.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if translucent yellow lampshade at left is taller than white paper book at center?" }, { "from": "gpt", "value": "Indeed, translucent yellow lampshade at left has a greater height compared to white paper book at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7c1f98c5e90a9318.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance from green striped sweater at lower left to matte black projector at upper center." }, { "from": "gpt", "value": "green striped sweater at lower left is 8.23 feet away from matte black projector at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e23923cbe1fdac00.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between pink cotton shirt at center and camera." }, { "from": "gpt", "value": "8.14 feet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ad86e5bbc02b14a.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the autumn scene and want to place a small bench between the green leafy tree at upper center and the dark purple foliage at left. Based on their positions, which object should the bench be closer to?" }, { "from": "gpt", "value": "The green leafy tree at upper center is located above the dark purple foliage at left, so the bench should be placed closer to the dark purple foliage at left to be between them." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/80a81c4c54262425.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the table where the two people are working. You need to place a 5 feet long banner between you and the gray sweater vest at center. Is there enough space?" }, { "from": "gpt", "value": "The distance between you and the gray sweater vest at center is 7.58 feet, which is greater than the banner length of 5 feet. Therefore, there is enough space to place the banner." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/48b6286558fe4584.jpg", "conversations": [ { "from": "human", "value": "\nLocate all pink plastic bag of shrimp at center in the image." }, { "from": "gpt", "value": "[(0.730, 0.567)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e02910334bcc3ca.jpg", "conversations": [ { "from": "human", "value": "\nIs white glossy newspaper at center to the left of white ceramic mug at left from the viewer's perspective?" }, { "from": "gpt", "value": "In fact, white glossy newspaper at center is to the right of white ceramic mug at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bec1f74bf3c4800f.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the pink fabric jacket at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.494, 0.581)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b1d67535a0ca93d.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.199, 0.494) from camera?" }, { "from": "gpt", "value": "They are 11.55 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7bbb0c02f2cc30f1.jpg", "conversations": [ { "from": "human", "value": "\nWhat is at (0.617, 0.128)?" }, { "from": "gpt", "value": "green leafy tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4441053868c4ea51.jpg", "conversations": [ { "from": "human", "value": "\nIs white textured vest at center wider than white cotton shirt at center?" }, { "from": "gpt", "value": "Indeed, white textured vest at center has a greater width compared to white cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d4fb1f88c647953c.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery driver who needs to load more hay bales onto the green matte truck bed at center. The natural straw bales at center are available. Can you fit more of them on the truck bed if they are stacked vertically?" }, { "from": "gpt", "value": "The natural straw bales at center is thinner than green matte truck bed at center, so stacking them vertically would allow more bales to fit on the truck bed since their thinner dimension aligns with the truck bed width." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a85eeba541747048.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, gray wool suit at center or matte black suit at center?" }, { "from": "gpt", "value": "gray wool suit at center is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06c68a63c2231dda.jpg", "conversations": [ { "from": "human", "value": "\nYou need to know if the black plastic monitor at upper left can fit horizontally on a desk that has enough space for the red matte shirt at center. Can it?" }, { "from": "gpt", "value": "The black plastic monitor at upper left is narrower than the red matte shirt at center, so it can fit horizontally on the desk if the desk has enough space for the red matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/52bf628e7910d6f7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if asphalt road at center is thinner than shiny metallic car at center?" }, { "from": "gpt", "value": "No, asphalt road at center is not thinner than shiny metallic car at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8de325568e7c10b0.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is white matte projector screen at upper center from gray hoodie at left?" }, { "from": "gpt", "value": "white matte projector screen at upper center is 2.31 meters from gray hoodie at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/054a88e2d6e36b08.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer taking a picture of two people sitting together. You notice the matte gray beanie at center and the matte black beanie at center. Which beanie will appear closer to the camera in the photo?" }, { "from": "gpt", "value": "The matte gray beanie at center appears closer to the camera because it is in front of the matte black beanie at center in the image." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc0dccc561ca863b.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the matte black motorcycle at left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.174, 0.672)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fcf4a351ce4681d9.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the matte gray letter p at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.617, 0.708)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b089f3f4bb12ed5.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.571, 0.556) or (0.395, 0.166)?" }, { "from": "gpt", "value": "The point (0.395, 0.166) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a1447ec4d819fbef.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of black matte suv at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.583, 0.772)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f546a28908f4109.jpg", "conversations": [ { "from": "human", "value": "\nYou are a construction worker who needs to attach a safety harness to the thinnest metal structure in the scene. Which object should you choose between the black metal pole at left and the metallic silver crane at upper right?" }, { "from": "gpt", "value": "The black metal pole at left is thinner than the metallic silver crane at upper right, so you should choose the black metal pole at left for attaching the safety harness." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5508515e3de9a5f7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if metallic gold picture frame at center is positioned above fluffy white dog at center?" }, { "from": "gpt", "value": "Yes, metallic gold picture frame at center is above fluffy white dog at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e2db465c3667a1f7.jpg", "conversations": [ { "from": "human", "value": "\nYou are a food critic sitting at a table with a dish in a white ceramic bowl. You notice the brown crispy insects at center. How far are they from you?" }, { "from": "gpt", "value": "The brown crispy insects at center are 3.58 feet away from you." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/826f9d35a64f627e.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the church and want to place a 3.5 feet wide flower arrangement exactly at the point labeled point (0.723, 0.573). Can you fit it there without moving any other objects?" }, { "from": "gpt", "value": "The point labeled point (0.723, 0.573) is 6.26 feet away from you. Since the flower arrangement is 3.5 feet wide, there is enough space to fit it at that location without moving other objects." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/774e58a268186790.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte gray coat at center have a lesser height compared to shiny silver bicycle at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/352246b18ebeced9.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.630, 0.853) and point (0.244, 0.648), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.630, 0.853) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/826c35b9507bdd59.jpg", "conversations": [ { "from": "human", "value": "\nWhere is white smooth garage door at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.528, 0.234)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/492a1e9c759ad4e5.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green textured tree at right? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.945, 0.620)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0537d1b7ce355fa2.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point where the truck is located. There is a point marked at coordinates point (0.769, 0.152). How far is that point from you?" }, { "from": "gpt", "value": "The point point (0.769, 0.152) is 6.77 meters away from the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f3d300df18e0de67.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the right, dark gray suit at right or gray suit at left?" }, { "from": "gpt", "value": "dark gray suit at right is more to the right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1a9cec46e6578e8.jpg", "conversations": [ { "from": "human", "value": "\nBetween black fabric court at center and black matte jacket at center, which one is positioned lower?" }, { "from": "gpt", "value": "black fabric court at center is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00ee44f77baf74b0.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.489, 0.639)?" }, { "from": "gpt", "value": "yellow-green feathers at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/24fb3833d250e7de.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of point (0.707, 0.133)?" }, { "from": "gpt", "value": "Point (0.707, 0.133) is 41.08 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b283a0c84068d9c.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of green leafy tree at upper left. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.091, 0.378)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3bb11769bd70c9f6.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of point (0.827, 0.383)?" }, { "from": "gpt", "value": "A distance of 3.97 meters exists between point (0.827, 0.383) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7272f36bd184a17.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the small red wooden house and want to know which chimney is closer to you. Can you tell me which one is closer between the smooth silver chimney at upper center and the smooth brick chimney at upper center?" }, { "from": "gpt", "value": "The smooth silver chimney at upper center is closer to you because it is in front of the smooth brick chimney at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd949c918164fb7d.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a clear photo of the matte black helmet at center. However, the matte black motorcycle at left is blocking your view. Can you move around to the right side of the motorcycle to get an unobstructed shot?" }, { "from": "gpt", "value": "The matte black motorcycle at left is in front of the matte black helmet at center, so moving to the right side of the motorcycle would allow you to see the matte black helmet at center without obstruction." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0276e633584e7f95.jpg", "conversations": [ { "from": "human", "value": "\nLocate the blue water at center in the image." }, { "from": "gpt", "value": "[(0.547, 0.873)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f49d7b9d0c2dbde4.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing a coat rack for guests at the event. The coat rack has a narrow hook that can only hold items up to 2 inches thick. You need to decide which of the following items can be safely hung on this hook without bending or damaging the hook. Which item from the image can be placed on the narrow hook? The options are the matte black suit at center and the striped jersey at left." }, { "from": "gpt", "value": "The matte black suit at center is thinner than the striped jersey at left, so it can be safely hung on the narrow hook without bending or damaging the hook." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3199ea6048bd03a8.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if light brown hair at center is smaller than white matte earphone at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea0949f228be5ffd.jpg", "conversations": [ { "from": "human", "value": "\nLocate brown wooden fence at center in the image." }, { "from": "gpt", "value": "[(0.592, 0.586)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ac094163b26edf4c.jpg", "conversations": [ { "from": "human", "value": "\nYou are visiting the memorial and want to take a photo of both the bronze statue at center and the bronze statue at upper center. Which statue should you focus on first to ensure both are in the frame?" }, { "from": "gpt", "value": "You should focus on the bronze statue at center first since it is positioned under the bronze statue at upper center, ensuring both are visible in the frame when centered." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/686c51b83be601fb.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of wooden fence at center less distant than that of white plastic triangle at center?" }, { "from": "gpt", "value": "Yes, wooden fence at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/22e9deeb7ce200d8.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue rubber glove at upper right is positioned below transparent plastic ruler at lower left?" }, { "from": "gpt", "value": "No, blue rubber glove at upper right is not below transparent plastic ruler at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b7e6c6fbf832d69.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of green grass at center in the image." }, { "from": "gpt", "value": "[(0.455, 0.814)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4466508098c3fdd.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the building facade and want to measure the distance between the green painted metal letters at center and the green metallic sign at center. What is the distance between them?" }, { "from": "gpt", "value": "The distance between the green painted metal letters at center and the green metallic sign at center is 47.51 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/64552cfedf4ae018.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.091, 0.217) in front of point (0.760, 0.803)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d710e50a836a959f.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked by the coordinate point at (0.129, 0.792). The woman with the small blue object is holding it. If you want to hand her a document, how far would you have to walk to reach her?" }, { "from": "gpt", "value": "You would have to walk 21.38 feet to reach the woman with the small blue object." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba1168cfd1bfe93c.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of brown/dusty cloud at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.505, 0.330)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f51f51a8b66fbb96.jpg", "conversations": [ { "from": "human", "value": "\nYou are a virtual assistant analyzing the desktop wallpaper. The image has a monochromatic coastal scene with a lighthouse on the right. There is a point marked at coordinates (0.451, 0.762). What does this point represent?" }, { "from": "gpt", "value": "The point at (0.451, 0.762) marks foggy misty water at bottom left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e6bae839a3885e79.jpg", "conversations": [ { "from": "human", "value": "\nIs velvet gold blazer at center to the left of velvet gold jacket at left from the viewer's perspective?" }, { "from": "gpt", "value": "Yes, velvet gold blazer at center is to the left of velvet gold jacket at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/437f28294628991a.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, brown fur otter at upper right or brown furry otter at upper right, stands shorter?" }, { "from": "gpt", "value": "Standing shorter between the two is brown furry otter at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d06a882d1adacdc4.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer taking a picture of the matte black shirt at center and the white bread hot dog at lower center. Which object will appear larger in the photo?" }, { "from": "gpt", "value": "The matte black shirt at center will appear larger in the photo because it is closer to the viewer than the white bread hot dog at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/520d3ea93e346d57.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at upper center is smaller than white marble gravestone at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca1aeb74f4245385.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if knitted multicolored blanket at center is shorter than wooden post at lower left?" }, { "from": "gpt", "value": "Correct, knitted multicolored blanket at center is not as tall as wooden post at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3e828147f80cb21a.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte/blackboard at center to the right of dark hair at lower left from the viewer's perspective?" }, { "from": "gpt", "value": "No, black matte/blackboard at center is not to the right of dark hair at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e6a79cc557796d52.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of white fabric tank top at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.364, 0.595)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fbb3328234f34221.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of yellow-green foliage at center-left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.181, 0.833)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e1bbb0e87cd6a343.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray matte water at center appear on the right side of green leafy tree at right?" }, { "from": "gpt", "value": "Incorrect, gray matte water at center is not on the right side of green leafy tree at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4719684a9c57873b.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between white plastic boat at lower center and camera?" }, { "from": "gpt", "value": "A distance of 95.79 feet exists between white plastic boat at lower center and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/22bdd5764a5c7d73.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to black polished wood gondola at right? Please provide its 2D coordinates.Where can I find black polished wood gondola at right? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.866, 0.659)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aad6b598fdc462f1.jpg", "conversations": [ { "from": "human", "value": "\nHow far is point (0.660, 0.009) from the camera?" }, { "from": "gpt", "value": "Point (0.660, 0.009) and camera are 38.21 inches apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf34feae4fbafb77.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.404, 0.814) from camera?" }, { "from": "gpt", "value": "The distance of point (0.404, 0.814) from camera is 18.47 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eeaeb16f3eff2fcb.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.255, 0.802)?" }, { "from": "gpt", "value": "matte black laptop at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5a4c388d7ceb754.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.830, 0.828) positioned after point (0.690, 0.617)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1772e7c666043ef3.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the dark blue suit at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.736, 0.658)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/086db80289e4a799.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the green plaid shirt at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.143, 0.561)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5aaabbfdfb209a4.jpg", "conversations": [ { "from": "human", "value": "\nYou are a parent trying to ensure safety for your children playing in a dry, barren area. You notice the pink striped shirt at center and the orange plastic toy at center. Which object is more likely to be visible from a distance due to its height?" }, { "from": "gpt", "value": "The pink striped shirt at center is much taller than the orange plastic toy at center, so it will be more visible from a distance." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9a87b52331e6777.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.717, 0.569) from camera?" }, { "from": "gpt", "value": "Point (0.717, 0.569) is 13.92 feet away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/649adc8417011f10.jpg", "conversations": [ { "from": "human", "value": "\nDoes brick fireplace at center appear over green woven chair at center?" }, { "from": "gpt", "value": "Yes, brick fireplace at center is above green woven chair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b996d4ed676ba83.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the green plastic street sign at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.341, 0.083)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d58e209614b0883.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.015, 0.855) and point (0.739, 0.269), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.739, 0.269) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e4ae5a35f26a0b34.jpg", "conversations": [ { "from": "human", "value": "\nIs light blue waterproof jacket at center to the left of dark gray fleece jacket at upper center from the viewer's perspective?" }, { "from": "gpt", "value": "No, light blue waterproof jacket at center is not to the left of dark gray fleece jacket at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a728fbc63407b41f.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.376, 0.120) more distant than point (0.145, 0.822)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/599b79ea5a3c02b2.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.549, 0.527) or point (0.394, 0.950)?" }, { "from": "gpt", "value": "The point (0.549, 0.527) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0bfceb8113a4f340.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of brown stone statue at center in the image." }, { "from": "gpt", "value": "[(0.334, 0.716)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f632d25e8d1b244d.jpg", "conversations": [ { "from": "human", "value": "\nIs concrete at center taller than white glossy airplane at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2a67a67707d99a51.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between floral-patterned umbrella at center and camera." }, { "from": "gpt", "value": "floral-patterned umbrella at center is 8.32 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/275447a6ec13bc4a.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the baseball stadium and want to know which of the two points, point (0.179, 0.537) or point (0.208, 0.844), is closer to you. Can you determine this based on the scene?" }, { "from": "gpt", "value": "Point (0.179, 0.537) is closer to the viewer than point (0.208, 0.844)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01c36046b9d3490b.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte baseball cap at center wider than green reflective vest at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4b6342272ce5de31.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.599, 0.200) or (0.123, 0.569)?" }, { "from": "gpt", "value": "Point (0.123, 0.569) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e34c0bcb838f8640.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a rustic stone ruins at center. Pinpoint a point to the rustic stone ruins at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.630, 0.506)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95256be87b037534.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from point (0.348, 0.877) to camera." }, { "from": "gpt", "value": "Point (0.348, 0.877) is 142.56 feet from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/90f4178d7d18944b.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.502, 0.648) lie behind point (0.732, 0.620)?" }, { "from": "gpt", "value": "No, it is in front of (0.732, 0.620)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f2574631e76b9e4.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of black wool coat at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.423, 0.608)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ef5ad8ac4ad25b0.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.849, 0.358) and point (0.839, 0.327), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.849, 0.358) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d927b708d4cdee2.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up for a presentation. You need to ensure that the black matte shirt at center is visible in the photo without being blocked by the black plastic projector at center. Based on their heights, can you confirm if the shirt will be visible?" }, { "from": "gpt", "value": "The black matte shirt at center has a greater height compared to the black plastic projector at center, so the shirt will be visible and not blocked by the projector." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/35aff983d319d7c9.jpg", "conversations": [ { "from": "human", "value": "\nIs glistening reflective water at center wider than wooden bench at lower center?" }, { "from": "gpt", "value": "Yes, glistening reflective water at center is wider than wooden bench at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d35ebcab3263b01.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between black matte t-shirt at left and black matte mouth at center." }, { "from": "gpt", "value": "The distance of black matte t-shirt at left from black matte mouth at center is 32.29 centimeters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2ed8b894e1eb85e.jpg", "conversations": [ { "from": "human", "value": "\nIs neon green sequined jacket at lower right smaller than yellow plaid shirt at center?" }, { "from": "gpt", "value": "Incorrect, neon green sequined jacket at lower right is not smaller in size than yellow plaid shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/690b626beaaafead.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the street food stall and want to reach the point marked at coordinates point (0.258, 0.642). If your arm can reach 3 feet, can you touch the point without moving your feet?" }, { "from": "gpt", "value": "The distance between you and point (0.258, 0.642) is 4.22 feet, which is longer than your 3 feet reach. Therefore, you cannot touch the point without moving your feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2260e9a449d0613e.jpg", "conversations": [ { "from": "human", "value": "\nPoint to orange matte doughnut at center.Point to the orange matte doughnut at center in the image." }, { "from": "gpt", "value": "[(0.712, 0.530)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6046830ab81d4f7b.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to brown fleece jacket at center? Please provide its 2D coordinates.Where can I find brown fleece jacket at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.515, 0.695)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/71a21143f1ef779f.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any translucent pinkish-gold at center in the image." }, { "from": "gpt", "value": "[(0.724, 0.855)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/686cd5bdd92d5f7d.jpg", "conversations": [ { "from": "human", "value": "\nDoes white fluffy cloud at upper center have a lesser width compared to green leafy tree at left?" }, { "from": "gpt", "value": "Incorrect, white fluffy cloud at upper center's width is not less than green leafy tree at left's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/38aa5abbbf0bc4b1.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery driver who needs to park your truck next to the matte white trailer at center. However, there is an asphalt road at lower right nearby. Based on the scene, which object is taller and would block your view when parking?" }, { "from": "gpt", "value": "The asphalt road at lower right is much taller than the matte white trailer at center, so it would block your view when parking." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2839c1ff4eb0f9e5.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.682, 0.742) come closer to viewer compared to point (0.493, 0.358)?" }, { "from": "gpt", "value": "No, it is behind (0.493, 0.358)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b04bdc911b1816b4.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of matte black table at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.260, 0.875)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c8b9223d4946790c.jpg", "conversations": [ { "from": "human", "value": "\nDoes black matte laptop at left have a greater width compared to gray plastic crt monitor at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9795f40077697182.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the white paper at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.472, 0.214)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/070c7be651579c09.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.464, 0.969) and point (0.025, 0.956), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.464, 0.969) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2326dcdefafb1061.jpg", "conversations": [ { "from": "human", "value": "\nIs pink tie-dye dress at center taller than yellow fabric chair at center?" }, { "from": "gpt", "value": "Incorrect, pink tie-dye dress at center's height is not larger of yellow fabric chair at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9e268b2b8061656b.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the room and want to reach the point marked at coordinates (0.223, 0.895). How far do you need to walk to get there?" }, { "from": "gpt", "value": "The point at coordinates (0.223, 0.895) is 1.25 meters away from you, so you need to walk 1.25 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fa0eca8a475cd7b0.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of the market and want to reach both the point at coordinates point (0.721, 0.464) and point (0.474, 0.827). Which point will you reach first?" }, { "from": "gpt", "value": "You will reach point (0.721, 0.464) first because it is closer to you than point (0.474, 0.827), which is further away." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ffc95f434e883537.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.709, 0.289) farther from camera compared to point (0.538, 0.630)?" }, { "from": "gpt", "value": "Yes, point (0.709, 0.289) is farther from viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6995ac3bf9abf7dc.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.811, 0.817) lie behind point (0.559, 0.803)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3e524e2e3a68fc61.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark gray hoodie at left have a larger size compared to blue matte shirt at center?" }, { "from": "gpt", "value": "Incorrect, dark gray hoodie at left is not larger than blue matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/90dc6fc73eb554d0.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the reddish-brown leather jacket at lower left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.311, 0.919)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b0d3d1f4dff5577.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.246, 0.972) closer to viewer compared to point (0.884, 0.344)?" }, { "from": "gpt", "value": "Yes, point (0.246, 0.972) is in front of point (0.884, 0.344)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/20cebdf8677944d5.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a blue patterned fabric couch at center. Pinpoint a point to the blue patterned fabric couch at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.298, 0.600)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/47ce7ca11c8593da.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.172, 0.897) and camera." }, { "from": "gpt", "value": "Point (0.172, 0.897) and camera are 4.57 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a9f4b5d2f86b81d2.jpg", "conversations": [ { "from": "human", "value": "\nDescribe the object at (0.878, 0.594)." }, { "from": "gpt", "value": "iridescent mesh figure at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6cd8af96679e1ae8.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, blue fabric jacket at left or matte blue cap at center?" }, { "from": "gpt", "value": "matte blue cap at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f50cdf220bb469c2.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked as point (0.620, 0.791) in the image. You need to walk to the wicker basket. How far do you have to walk in feet?" }, { "from": "gpt", "value": "You have to walk 6.56 feet to reach the wicker basket from point (0.620, 0.791)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07ea4ce6322b8c48.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if wooden at center is smaller than smooth red pole at right?" }, { "from": "gpt", "value": "Correct, wooden at center occupies less space than smooth red pole at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f80fd28d7374c00d.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.860, 0.798) positioned before point (0.652, 0.800)?" }, { "from": "gpt", "value": "No, (0.860, 0.798) is further to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c2279e670409c3e.jpg", "conversations": [ { "from": "human", "value": "\nBetween green mossy rocks at center and clear water at center, which one is positioned higher?" }, { "from": "gpt", "value": "clear water at center is higher up." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3e6e65aacdaabf3b.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the gray concrete pavement at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.507, 0.797)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e898155e78cf3c1d.jpg", "conversations": [ { "from": "human", "value": "\nHow close is point (0.109, 0.780) from camera?" }, { "from": "gpt", "value": "Point (0.109, 0.780) is 4.25 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b24d7aab53e97304.jpg", "conversations": [ { "from": "human", "value": "\nHow close is brick building at center from green leafy tree at upper right?" }, { "from": "gpt", "value": "48.68 feet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce708ce54578d940.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a matte red cowboy hat at upper right. Pinpoint a point to the matte red cowboy hat at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.615, 0.406)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8be1cbc3899f789a.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of brown/dry wood branch at left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.543, 0.217)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9619d97e2e6fde73.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between point (0.058, 0.367) and camera." }, { "from": "gpt", "value": "A distance of 3.31 meters exists between point (0.058, 0.367) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e82cb196a4fb5be.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the center of the rectangular swimming pool and looking towards the green leafy tree at upper center. Based on the coordinates provided, in which direction should you walk to reach the tree?" }, { "from": "gpt", "value": "The green leafy tree at upper center is located at coordinates point (0.503, 0.155). Since you are at the center of the pool, you should walk towards the upper center direction to reach the tree." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/601f03ade5f43616.jpg", "conversations": [ { "from": "human", "value": "\nYou are sitting in the passenger seat of a car and notice the purple reflective sunglasses at right. Based on their position coordinates, can you determine if they are closer to the front or back of the car?" }, { "from": "gpt", "value": "The purple reflective sunglasses at right are located at coordinates point (0.907, 0.328). Since the y coordinate is closer to 1, which typically represents the bottom of the image, this suggests they are positioned near the lower part of the car interior, likely closer to the back of the car." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/199a8c17e3c7403e.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of metallic silver sedan at center from camera?" }, { "from": "gpt", "value": "A distance of 3.44 meters exists between metallic silver sedan at center and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b195612db439dd0c.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.223, 0.170) and point (0.157, 0.309), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.157, 0.309) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/615d57f7ad61e5cf.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, dark gray sweater at lower center or light brown wooden chair at lower center, stands shorter?" }, { "from": "gpt", "value": "dark gray sweater at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/529a9391bec74409.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the black plastic stool at lower left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.247, 0.891)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b4737ef4f96fa54.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the black metal shelf at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.407, 0.502)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05f54ce33686ecaf.jpg", "conversations": [ { "from": "human", "value": "\nIs blue fabric shirt at right above red cotton shirt at center?" }, { "from": "gpt", "value": "Actually, blue fabric shirt at right is below red cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3859528523982ef7.jpg", "conversations": [ { "from": "human", "value": "\nWhat are the coordinates of the shiny silver phone at center?" }, { "from": "gpt", "value": "The coordinates of the shiny silver phone at center are at point (0.461, 0.334)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c0881a6235154b2e.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.780, 0.373) and point (0.614, 0.317), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.614, 0.317) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/98f589c980c394df.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.219, 0.711) or (0.401, 0.772)?" }, { "from": "gpt", "value": "The point (0.401, 0.772) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/401a1e0d0071695f.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between orange matte kayak at center and camera." }, { "from": "gpt", "value": "They are 5.53 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e16d34fa2888f4ac.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of the Golden Pavilion and want to take a photo of the golden polished wood pagoda at center. If your camera can focus on objects up to 60 meters away, will it be able to capture the pagoda clearly?" }, { "from": "gpt", "value": "The golden polished wood pagoda at center is 63.00 meters away from the camera, which is beyond the camera focus range of 60 meters. Therefore, the camera will not be able to capture the pagoda clearly." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dac25c6c603d574c.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the park and see the striped cotton shirt at center. If you want to approach it, how far do you need to walk?" }, { "from": "gpt", "value": "The striped cotton shirt at center is 46.61 feet away from you, so you need to walk 46.61 feet to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de16e9f57a5f3ac3.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing an office space and need to move the brown cardboard box at lower left and the green fabric swivel chair at upper left. Based on their current positions, which object is located to the right of the other?" }, { "from": "gpt", "value": "The brown cardboard box at lower left is to the right of the green fabric swivel chair at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/062bd9946f59631c.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between white cotton shirt at left and camera?" }, { "from": "gpt", "value": "4.39 feet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eabb18fed1f622db.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.684, 0.320) or (0.086, 0.753)?" }, { "from": "gpt", "value": "Positioned in front is point (0.684, 0.320)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c0f0e0fae803354.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the start of the forest trail and see two points marked on the path. The first point is at coordinates point (0.519, 0.989) and the second is at point (0.933, 0.764). Which point is nearer to you as you begin your walk?" }, { "from": "gpt", "value": "Point (0.519, 0.989) is closer to the camera than point (0.933, 0.764), so the first point is nearer to you as you begin your walk." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/71ed405d0d6a9828.jpg", "conversations": [ { "from": "human", "value": "\nBetween yellow matte shirt at center and yellow matte t-shirt at center, which one is positioned higher?" }, { "from": "gpt", "value": "Positioned higher is yellow matte t-shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ddcc93fba3df6437.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.332, 0.697) less distant than point (0.682, 0.520)?" }, { "from": "gpt", "value": "Yes, point (0.332, 0.697) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f41d5894b5d1c907.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if asphalt road at center is wider than wooden bench at right?" }, { "from": "gpt", "value": "Yes, asphalt road at center is wider than wooden bench at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9df6700a096ef5c3.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, blonde hair at lower left or matte black laptop at right?" }, { "from": "gpt", "value": "With more height is matte black laptop at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/84172c129205529e.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark blue suit at center have a lesser width compared to white shirt at center?" }, { "from": "gpt", "value": "Incorrect, dark blue suit at center's width is not less than white shirt at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/20124544b9d0e8b5.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.811, 0.609) or point (0.287, 0.936)?" }, { "from": "gpt", "value": "Point (0.287, 0.936) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1364a44c2f62a80f.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a multicolored fabric costume at center. Pinpoint a point to the multicolored fabric costume at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.460, 0.572)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/945498568a94f95c.jpg", "conversations": [ { "from": "human", "value": "\nYou are an observer standing at the edge of the stream. You notice the green leafy tree at upper center and the orange life vest at center. Which object is closer to you?" }, { "from": "gpt", "value": "The green leafy tree at upper center is closer to the viewer than the orange life vest at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c03bd57ff0c4f310.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the middle of the street and see the black matte rail at center and the brushed metal pole at center. Which object is nearer to you?" }, { "from": "gpt", "value": "The black matte rail at center is closer to the viewer than the brushed metal pole at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/91670ecba0990a57.jpg", "conversations": [ { "from": "human", "value": "\nYou are sitting on the velvet red couch at lower center and want to look at the clear water at center. Which object is nearer to you when you look straight ahead?" }, { "from": "gpt", "value": "The velvet red couch at lower center is closer to the viewer than the clear water at center, so the velvet red couch at lower center is nearer to you when you look straight ahead." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff5892a84458a00f.jpg", "conversations": [ { "from": "human", "value": "\nIs blue jeans at center to the right of blue shirt at upper left from the viewer's perspective?" }, { "from": "gpt", "value": "Indeed, blue jeans at center is positioned on the right side of blue shirt at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a868d7f2ffa5a0fc.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.614, 0.505) positioned in front of point (0.945, 0.642)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc69dd25a4f38418.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.669, 0.956) come closer to viewer compared to point (0.501, 0.787)?" }, { "from": "gpt", "value": "Yes, point (0.669, 0.956) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df35b5ecfc7b756a.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of matte black shirt at left. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.089, 0.608)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/75abd4a74a817320.jpg", "conversations": [ { "from": "human", "value": "\nDoes yellow fabric at center lie behind yellow satin dress at lower right?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/48e526922a333351.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.932, 0.325) or (0.971, 0.447)?" }, { "from": "gpt", "value": "Positioned in front is point (0.971, 0.447)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0374225a59292826.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the matte plastic figure at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.256, 0.173)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c5e4d45f33bc7937.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.652, 0.044) lie behind point (0.621, 0.670)?" }, { "from": "gpt", "value": "Yes, it is behind point (0.621, 0.670)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9bba5728845a2eff.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the green leafy palm at upper left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.190, 0.405)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/91418238fdd02141.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.668, 0.706) and point (0.603, 0.381), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.668, 0.706) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aded0d045e18cc0b.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.493, 0.600)?" }, { "from": "gpt", "value": "green velvet cape at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e437ab26ec01a93.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if shiny metallic bicycle at center is bigger than dark brown leather jacket at center?" }, { "from": "gpt", "value": "No, shiny metallic bicycle at center is not bigger than dark brown leather jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ba69394a4dc2bd6.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of dark gray jacket at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.312, 0.802)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e37c6d0950736132.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the yellow reflective arrow at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.385, 0.766)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44fb3360e404a00b.jpg", "conversations": [ { "from": "human", "value": "\nDoes green feathered bird at upper center have a larger size compared to dark green feathers at upper center?" }, { "from": "gpt", "value": "Yes, green feathered bird at upper center is bigger than dark green feathers at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e8f0f65f1eb6c83.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the green leafy tree at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.489, 0.195)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/11b7d788384460fb.jpg", "conversations": [ { "from": "human", "value": "\nYou are a botanist examining the green fuzzy moss at center and the green textured bark at upper center. Which of these two objects is taller?" }, { "from": "gpt", "value": "The green fuzzy moss at center is taller than the green textured bark at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01153e130541cb67.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, pink fabric shirt at center or matte white tank top at left, stands taller?" }, { "from": "gpt", "value": "matte white tank top at left is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85181fbf27b57391.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of dry skin hand at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.578, 0.564)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/75081b864dfae1e1.jpg", "conversations": [ { "from": "human", "value": "\nDoes maroon fleece jacket at center come in front of blue fleece jacket at upper right?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/577f3a34b159c312.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.543, 0.933) come in front of point (0.321, 0.509)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5aa07d52e535e67.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.129, 0.611) come closer to viewer compared to point (0.487, 0.320)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2070a638ace6f860.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, brown rough tree at center-left or brown furry horse at lower right, stands taller?" }, { "from": "gpt", "value": "brown rough tree at center-left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e892cc3a21030ff0.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black life vest at left is thinner than black fabric life jacket at upper left?" }, { "from": "gpt", "value": "Yes, matte black life vest at left is thinner than black fabric life jacket at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4009f69d7a4bbb14.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue plaid skirt at center is positioned above blue plaid dress at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/27c0205776d4be2d.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.118, 0.881) farther from camera compared to point (0.991, 0.586)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/13dcfd2517527c36.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance from white matte hijab at center to white striped hoodie at center." }, { "from": "gpt", "value": "A distance of 15.70 meters exists between white matte hijab at center and white striped hoodie at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5ac964dfb27232e1.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if beige leather chair at center is smaller than light brown leather chair at lower right?" }, { "from": "gpt", "value": "No, beige leather chair at center is not smaller than light brown leather chair at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/26d4d2facb28dce4.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.470, 0.287) and point (0.137, 0.195), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.137, 0.195) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3abf38e0e8b619d2.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray cotton shirt at center have a larger size compared to dark hair at lower left?" }, { "from": "gpt", "value": "Yes, gray cotton shirt at center is bigger than dark hair at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb1d854561535c5f.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, denim shirt at center or green matte polo shirt at left, stands taller?" }, { "from": "gpt", "value": "Standing taller between the two is denim shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/38a6dacef62fe777.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of gray hoodie at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.174, 0.669)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7d07d1610bb0958.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of yellow brick ruins at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.578, 0.516)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b92819588d64e04.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the sidewalk and see the brick pavement at center and the orange matte bicycle at center. Which object is located to the right when viewed from your perspective?" }, { "from": "gpt", "value": "The brick pavement at center is to the right of the orange matte bicycle at center, so the brick pavement at center is located to the right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e218585af383908.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of white powdery snow at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.479, 0.844)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7a98638cffa59845.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up a shoot in the living room. You need to position a light source to the left of the marble fireplace at center. Where should you place it in relation to the washed denim jeans at center?" }, { "from": "gpt", "value": "The light source should be placed to the left of the marble fireplace at center, which is also to the left of the washed denim jeans at center since the jeans are to the right of the fireplace." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d934b31245c5b74f.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to brown sweater at center? Please provide its 2D coordinates.Where can I find brown sweater at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.559, 0.398)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ade23e51b0338126.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black hat at center below matte orange shirt at center?" }, { "from": "gpt", "value": "Yes, matte black hat at center is below matte orange shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1f61b71cf5f4f9b.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of glassy steel skyscraper at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.834, 0.539)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f790cd4a8cd0cce3.jpg", "conversations": [ { "from": "human", "value": "\nIs rubberized plastic toy car at right smaller than orange plastic toy at lower left?" }, { "from": "gpt", "value": "Actually, rubberized plastic toy car at right might be larger than orange plastic toy at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4313a524bbdddb37.jpg", "conversations": [ { "from": "human", "value": "\nBetween green leafy tree at left and green leafy tree at right, which one is positioned higher?" }, { "from": "gpt", "value": "green leafy tree at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/90b01f2740281b30.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, shiny metallic mantis at center or green plastic sign at center?" }, { "from": "gpt", "value": "green plastic sign at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e3ba2c05f69f7606.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if light blue stone castle at center is thinner than denim pants at lower right?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cab2b25c3742d6ea.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark scaly crocodile at center is smaller than shiny black crocodile at center?" }, { "from": "gpt", "value": "No, dark scaly crocodile at center is not smaller than shiny black crocodile at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70056e40ecedacc6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black matte sweater at center is wider than stainless steel refrigerator at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c924dc4643f1be6.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the room with the art installation made of books. You see a point marked at coordinates (0.549, 0.641). Which object is this point located on?" }, { "from": "gpt", "value": "The point at coordinates (0.549, 0.641) is located on the red fabric baby carriage at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/55ef9d84c7ffd434.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of silhouette pine at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.473, 0.820)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e7328901f28a7a4.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any clear blue water at center in the image." }, { "from": "gpt", "value": "[(0.491, 0.822)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/374d85e532667dbb.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery driver approaching the building and need to park your vehicle. You see a gold metallic suv at lower right and a metallic silver car at lower left. Which vehicle is blocking the entrance from your perspective?" }, { "from": "gpt", "value": "The metallic silver car at lower left is behind the gold metallic suv at lower right, so the gold metallic suv at lower right is blocking the entrance from your perspective." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77ebfa9f1b3f6b16.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of striped fabric jacket at left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.188, 0.667)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cfe41ad1dcd0c9e6.jpg", "conversations": [ { "from": "human", "value": "\nCould you measure the distance between matte purple jacket at center and black leather jacket at center?" }, { "from": "gpt", "value": "They are 4.48 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce084bbf36d138e4.jpg", "conversations": [ { "from": "human", "value": "\nYou are a pedestrian standing on the sidewalk next to the brushed metal truck at center. You need to cross the road to reach the blue fabric shirt at center. Which direction should you walk along the road before crossing to reach the shirt?" }, { "from": "gpt", "value": "The blue fabric shirt at center is positioned on the right side of the brushed metal truck at center. Since the road curves gently to the right, you should walk along the sidewalk in the direction of the curve, following the road towards the right, then cross to reach the blue fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/55422b7d21e8d03d.jpg", "conversations": [ { "from": "human", "value": "\nBetween light blue shirt at center and black plastic laptop at lower right, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "black plastic laptop at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/48e44e89bf4c68c5.jpg", "conversations": [ { "from": "human", "value": "\nIs blue fabric at center positioned at the back of matte blue shirt at upper center?" }, { "from": "gpt", "value": "No, blue fabric at center is in front of matte blue shirt at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/71fa553914cc270b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark gray fabric jacket at center is taller than light gray fabric bag at center?" }, { "from": "gpt", "value": "Yes, dark gray fabric jacket at center is taller than light gray fabric bag at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46f55dce56b7a11a.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the historic brick building and notice two green leafy trees. One is labeled as the green leafy tree at left and the other as the green leafy tree at right. Which tree is closer to the building?" }, { "from": "gpt", "value": "The green leafy tree at left is positioned under green leafy tree at right, meaning the green leafy tree at left is closer to the building." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4cec51e31c18e0af.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.158, 0.681) positioned behind point (0.641, 0.583)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/782a5a9bf27fae02.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of matte white shirt at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.309, 0.517)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/837050914b63005d.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the lakeside and want to locate the green water at center. According to the coordinates provided, where exactly should you look?" }, { "from": "gpt", "value": "The green water at center is located at coordinates point (0.438, 0.583)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d28b0366592242b.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the shiny metallic costume at center and the velvet orange cape at center in a single shot. Which one appears closer to your camera lens?" }, { "from": "gpt", "value": "The shiny metallic costume at center appears closer to the camera lens because it is further to the viewer than the velvet orange cape at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b077194f117fea32.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.992, 0.912) more distant than point (0.748, 0.495)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c2f77cd7835680d.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.594, 0.269) from camera?" }, { "from": "gpt", "value": "They are 35.34 inches apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/87e260cf1802e4c2.jpg", "conversations": [ { "from": "human", "value": "\nIs brown leather armor at center in front of blue denim jeans at center?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b90859dbce1b1c38.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a white glossy table at center. Pinpoint a point to the white glossy table at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.878, 0.883)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4dd350c11a082f08.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the green artificial turf at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.538, 0.895)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b748f34dbed3916.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of point (0.060, 0.603)?" }, { "from": "gpt", "value": "They are 2.32 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6fe5637a7b3711a1.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between point (0.907, 0.889) and camera." }, { "from": "gpt", "value": "Point (0.907, 0.889) and camera are 15.55 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/178f361668a873a5.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.815, 0.372) or (0.009, 0.163)?" }, { "from": "gpt", "value": "Point (0.009, 0.163)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/777ed612b08497c9.jpg", "conversations": [ { "from": "human", "value": "\nDoes silver metallic jeep at center have a lesser height compared to black hoodie at lower left?" }, { "from": "gpt", "value": "Yes, silver metallic jeep at center is shorter than black hoodie at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b14756cc38c71a25.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of leather boot at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.768, 0.344)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/efba136203c6b213.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the brick paved square at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.513, 0.822)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36f77265e7c14645.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.918, 0.395) or (0.040, 0.956)?" }, { "from": "gpt", "value": "The point (0.918, 0.395) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8d8bd0f3a66a29e.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, white fabric flag at right or red fabric flag at center?" }, { "from": "gpt", "value": "Positioned lower is white fabric flag at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/27edf233eb5ca2ec.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of black fabric at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.727, 0.362)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/af62ec93d9d2b262.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between dark blue uniform at center and camera?" }, { "from": "gpt", "value": "The distance of dark blue uniform at center from camera is 6.76 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e08373950387d80c.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the garden scene and want to place a small decorative statue exactly at the center of the garden. Given the green grass at lower left, where would you position the statue to ensure it is centered?" }, { "from": "gpt", "value": "The green grass at lower left is located at point (0.368, 0.920). To center the statue, you would need to position it at the midpoint between this point and the opposite corner of the garden, which would be point (0.632, 0.080)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1ea8f1d2a8ab5fb.jpg", "conversations": [ { "from": "human", "value": "\nYou are an event organizer who needs to arrange seating for two more guests. The current setup has the matte black suit at center and white matte blazer at center. Which of the two has more space available next to it for adding a chair?" }, { "from": "gpt", "value": "The white matte blazer at center has more space available next to it because it is larger than the matte black suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0624c3d444ec3737.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of brown rough rock at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.779, 0.464)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/111a2cff9034c6a5.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.696, 0.362) lie in front of point (0.806, 0.609)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2a78a16ec1afe12a.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.256, 0.430) come closer to viewer compared to point (0.447, 0.172)?" }, { "from": "gpt", "value": "Yes, point (0.256, 0.430) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ae571f3ff9acd4ac.jpg", "conversations": [ { "from": "human", "value": "\nHow far is point (0.082, 0.991) from the camera?" }, { "from": "gpt", "value": "10.38 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/31e5ecd6157c49a1.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the rural landscape scene and want to reach the point marked as point (0.621, 0.997). How far is this point from you?" }, { "from": "gpt", "value": "The point (0.621, 0.997) is 4.46 meters away from the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92d13c4617362c03.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.395, 0.725) or (0.774, 0.575)?" }, { "from": "gpt", "value": "Point (0.774, 0.575)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4112abba8e86ad56.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.425, 0.894) and point (0.322, 0.778), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.425, 0.894) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d2fd1e773f47293c.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, clear glass wine glass at center or translucent glass wine at center?" }, { "from": "gpt", "value": "translucent glass wine at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/33ba40caac9b85bc.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing in front of the group and want to take a photo that includes both the matte white shark at center and the shiny gold dress at left. Which object should you focus on first to ensure both are in focus?" }, { "from": "gpt", "value": "The matte white shark at center is further to the viewer than the shiny gold dress at left, so you should focus on the matte white shark at center first to ensure both are in focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e86b01a85bfe79ee.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the paved path on the left side of the image. You want to see the reflection of the green leafy tree at center in the green reflective water at center. Is the tree reflected in the water?" }, { "from": "gpt", "value": "The green leafy tree at center is positioned over green reflective water at center, so its reflection should be visible in the water since the water is reflective." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ace6663e2f132a13.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between matte gray arm at upper center and matte black hand at center?" }, { "from": "gpt", "value": "5.67 inches" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77d04fe82794a872.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.096, 0.661) from camera?" }, { "from": "gpt", "value": "59.56 feet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b49f0ebcc9a16b44.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the teal matte boat at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.904, 0.552)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f1478ff2f12b0a2.jpg", "conversations": [ { "from": "human", "value": "\nBetween dark blue denim jacket at center and sunglasses at center, which one has more height?" }, { "from": "gpt", "value": "With more height is dark blue denim jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf85c8a697489273.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.136, 0.639) and point (0.707, 0.575), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.707, 0.575) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e206c72baea7573.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the bedroom and want to adjust the lighting. There are two objects at the center of the room, the white blinds at center and the white glossy lampshade at center. Which object should you approach first if you want to reach the one on the left side first?" }, { "from": "gpt", "value": "The white blinds at center is to the left of white glossy lampshade at center, so you should approach the white blinds at center first." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8ef17e814d1ed797.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.603, 0.181)?" }, { "from": "gpt", "value": "dark suit jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9d1938980d5018c.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is black matte necklace at center from camera?" }, { "from": "gpt", "value": "8.38 feet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01a20398c771c26c.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of matte gray suit at center from camera?" }, { "from": "gpt", "value": "matte gray suit at center and camera are 4.63 feet apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/784d0d0df99942c0.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any white matte t-shirt at center in the image." }, { "from": "gpt", "value": "[(0.373, 0.594)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2233c4eeed5003d.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the tan leather jacket at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.513, 0.623)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70bbff1b793be940.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the town square and want to take a photo of the green copper dome at right. However, the dense foliage of the tree in the foreground is blocking your view. Based on the coordinates provided, can you determine if the dome is visible from your current position?" }, { "from": "gpt", "value": "The green copper dome at right is located at point (0.900, 0.305). Since the tree is in the foreground and partially obscures the view, it is possible that the dome is still visible depending on the exact positioning. However, without additional information about the tree canopy coverage, it is uncertain if the dome is fully visible." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/15a8cd0a210830f1.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.520, 0.580) or (0.801, 0.580)?" }, { "from": "gpt", "value": "Point (0.801, 0.580)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e78233134cced8b6.jpg", "conversations": [ { "from": "human", "value": "\nLocate all green grass at lower center in the image." }, { "from": "gpt", "value": "[(0.419, 0.906)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/51922780bc56e419.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of white glossy table at lower center?" }, { "from": "gpt", "value": "They are 4.03 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3cb652b27887597e.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any dark gray rocky mountain at center in the image." }, { "from": "gpt", "value": "[(0.509, 0.570)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2bcdcec3b095d320.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between matte wood window at center and camera." }, { "from": "gpt", "value": "10.61 feet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c48858c6d44fbdb8.jpg", "conversations": [ { "from": "human", "value": "\nYou are at point (0.984, 0.242) and want to reach point (0.240, 0.478). Is there a clear path between them?" }, { "from": "gpt", "value": "Yes, since point (0.984, 0.242) is in front of point (0.240, 0.478), there is a clear path between them." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ca1de8f69c49e0f.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white matte shirt at center is positioned to the right of black floral swimsuit at center?" }, { "from": "gpt", "value": "No, white matte shirt at center is not to the right of black floral swimsuit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e27dc7a24026f00.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, green grassy field at center or brown dirt track at center, stands taller?" }, { "from": "gpt", "value": "With more height is green grassy field at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/97c281619f9c731e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white matte cityscape at center is smaller than matte paper poster at center?" }, { "from": "gpt", "value": "Incorrect, white matte cityscape at center is not smaller in size than matte paper poster at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f903eb35e097ac31.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if smooth sand dune at lower center is positioned above black plastic license plate at lower left?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b29bb3e20de2df70.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black fabric stroller at left is positioned to the right of knitted teal shawl at center?" }, { "from": "gpt", "value": "No, black fabric stroller at left is not to the right of knitted teal shawl at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0450b75f51d3ceb7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if shiny brown bull at center is positioned to the left of shiny brown bull at left?" }, { "from": "gpt", "value": "Incorrect, shiny brown bull at center is not on the left side of shiny brown bull at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d3d4c56c2d25ff8.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at right have a greater width compared to dirt/gravel path at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00020b30ea18e8a3.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the event and need to capture a photo where both the blue track pants at center and the white matte uniform at center are visible. Which object should you ensure is closer to the camera to avoid it being blocked by the other?" }, { "from": "gpt", "value": "The blue track pants at center is not as tall as the white matte uniform at center, so you should ensure the blue track pants at center is closer to the camera to avoid it being blocked by the taller white matte uniform at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/20b76157a1550417.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the middle of the cobblestone alleyway and see two points marked on the ground. One is at point coordinates point (0.372, 0.509) and the other is at point coordinates point (0.418, 0.991). Which point is closer to you?" }, { "from": "gpt", "value": "Point (0.372, 0.509) is closer to you because it is further to the viewer than point (0.418, 0.991)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d25be3862d82386.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at upper center is positioned to the left of white marble column at center?" }, { "from": "gpt", "value": "Indeed, green leafy tree at upper center is positioned on the left side of white marble column at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08b537a0093ae4f0.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.326, 0.205) come behind point (0.855, 0.209)?" }, { "from": "gpt", "value": "Yes, it is behind point (0.855, 0.209)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fab25afbd0002d35.jpg", "conversations": [ { "from": "human", "value": "\nYou are a customer standing outside the Chop Stick Restaurant. You look through the storefront window and see the gold paper sign at center and the light blue fabric at center. Which object is positioned to the right of the other?" }, { "from": "gpt", "value": "The gold paper sign at center is to the right of the light blue fabric at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e50cd1f335773ca4.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.929, 0.522) or (0.563, 0.713)?" }, { "from": "gpt", "value": "Point (0.563, 0.713) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c39db044ada4630.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.027, 0.677) come in front of point (0.091, 0.903)?" }, { "from": "gpt", "value": "No, (0.027, 0.677) is behind (0.091, 0.903)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce345b44b8e0ddd5.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at left have a lesser width compared to brown wooden stakes at lower center?" }, { "from": "gpt", "value": "Indeed, green leafy tree at left has a lesser width compared to brown wooden stakes at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/360ccf102acd8539.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of blue fabric cap at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.213, 0.230)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8ba8d6ad381f7e59.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.274, 0.869) positioned in front of point (0.746, 0.433)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/757b59c36b81bdcd.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.449, 0.683) come farther from viewer compared to point (0.159, 0.339)?" }, { "from": "gpt", "value": "No, (0.449, 0.683) is in front of (0.159, 0.339)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c5cc46d070e34c80.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.646, 0.684)?" }, { "from": "gpt", "value": "smooth stone column at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7366582ae312919a.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, dark blue fleece jacket at left or blue fabric baseball cap at upper left?" }, { "from": "gpt", "value": "blue fabric baseball cap at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/828b72887760ee8d.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.817, 0.673) or point (0.627, 0.494)?" }, { "from": "gpt", "value": "The point (0.627, 0.494) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/975c897c1ad90943.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to matte gray shirt at center? Please provide its 2D coordinates.Where can I find matte gray shirt at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.649, 0.531)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/302e5cc7f02b0864.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.634, 0.466) come in front of point (0.696, 0.912)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/056ec6b5c2db1fc4.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the light gray sweater at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.234, 0.541)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/697703611dd90c26.jpg", "conversations": [ { "from": "human", "value": "\nBetween green matte shirt at center and green cotton shirt at center, which one is positioned lower?" }, { "from": "gpt", "value": "Positioned lower is green matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd42b6f0ea8cdaec.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the base of the mountain and want to reach a specific point marked at coordinates point (0.142, 0.531). Given that your current position is 1500 feet away from this point, can you safely walk towards it without needing to backtrack?" }, { "from": "gpt", "value": "The distance of point (0.142, 0.531) from viewer is 1110.97 feet. Since your current position is 1500 feet away, you are still 389.03 feet away from the point. You can continue walking towards it without needing to backtrack." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e29907c96ce97840.jpg", "conversations": [ { "from": "human", "value": "\nIs white fabric shirt at center shorter than white matte shirt at center?" }, { "from": "gpt", "value": "No, white fabric shirt at center is not shorter than white matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/64085d6da8927631.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark brown wood at center is bigger than blue denim shorts at lower left?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6570064b44922344.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of bare branches at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.783, 0.300)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c197b6547dab19db.jpg", "conversations": [ { "from": "human", "value": "\nYou are a tailor who needs to adjust the distance between the black matte suit at center and the satin pink blouse at center to 10 inches for a photoshoot. How much should you move one of the garments?" }, { "from": "gpt", "value": "The black matte suit at center is currently 12.12 inches from the satin pink blouse at center. To reduce the distance to 10 inches, you need to move one garment closer by 1.06 inches." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df1bba8bb35a85ab.jpg", "conversations": [ { "from": "human", "value": "\nYou are planning to take a photo of the green matte trees at center and the wooden boat at center from a distance. Which object will appear bigger in the photo?" }, { "from": "gpt", "value": "The green matte trees at center will appear bigger in the photo because they are larger in size than the wooden boat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e53d4eb80fddc99b.jpg", "conversations": [ { "from": "human", "value": "\nWhere is white fabric cap at upper right located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.953, 0.530)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc12503ff15fabf6.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, dark gray pinstripe suit at center or clear glass at center, stands shorter?" }, { "from": "gpt", "value": "clear glass at center is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02991116580d0ff1.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, satin black dress at center or shiny brown hair at center?" }, { "from": "gpt", "value": "Positioned higher is shiny brown hair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/badac49ef8449198.jpg", "conversations": [ { "from": "human", "value": "\nYou are an event organizer trying to arrange seating for a panel discussion. You notice two attendees wearing the black sweater at center and the teal fabric shirt at center. Based on their current positions, which attendee should you seat closer to the front of the room to maintain their current spatial relationship?" }, { "from": "gpt", "value": "The black sweater at center should be seated closer to the front of the room because it is positioned under the teal fabric shirt at center, meaning it is currently closer to the bottom of the image and thus closer to the front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77fc3701b19cf106.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.793, 0.736) lie in front of point (0.080, 0.630)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/69d1054d2df6c029.jpg", "conversations": [ { "from": "human", "value": "\nYou are a surveyor measuring the distance between the transparent glass river at center and the green leafy hillside at upper center. What is the distance between them?" }, { "from": "gpt", "value": "The distance between the transparent glass river at center and the green leafy hillside at upper center is 78.62 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cb8c5b3627dda3cd.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.490, 0.489) come behind point (0.626, 0.569)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2aa33738f04bedce.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between matte white bowl at center and camera." }, { "from": "gpt", "value": "They are 2.66 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6cbb4c5eca79c80a.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of brown stone tower at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.412, 0.539)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a377af63eb9d4046.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, purple silk sari at center or white lace table at lower center?" }, { "from": "gpt", "value": "From the viewer's perspective, white lace table at lower center appears more on the left side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f2e05dec992187e6.jpg", "conversations": [ { "from": "human", "value": "\nIs gray concrete courtyard at center further to camera compared to white tile church at upper center?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85fbee6efae7586d.jpg", "conversations": [ { "from": "human", "value": "\nYou are taking a photo of Marisa, who is standing in front of you. You notice a point at coordinate (0.376, 0.312) on her outfit. How far is this point from the camera?" }, { "from": "gpt", "value": "The point at coordinate (0.376, 0.312) is 1.45 meters away from the camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ba3dc8ee995b40c.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the rusty stone rock at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.372, 0.677)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e7507fcff1ca581.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the same location as the photographer capturing this scene. Looking at the matte blue dress shirt at left, where would you position your camera to focus on it? Provide coordinates as a point between 0 and 1 for both x and y, with the origin at the bottom left corner of the image." }, { "from": "gpt", "value": "The coordinates for the matte blue dress shirt at left are at point (0.113, 0.514). To focus on it, position your camera at those coordinates." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2a743aa3d94bc9d7.jpg", "conversations": [ { "from": "human", "value": "\nHow much distance is there between wooden posts at lower center and smooth brown tree at upper right?" }, { "from": "gpt", "value": "wooden posts at lower center and smooth brown tree at upper right are 317.31 feet apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ac709cf2986810bd.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the garden where the bronze sculptures are displayed. You notice two points marked in the image. The first point is at coordinates point (0.499, 0.041) and the second is at point (0.297, 0.169). Which point is closer to you?" }, { "from": "gpt", "value": "Point (0.499, 0.041) is in front of point (0.297, 0.169), so it is closer to you." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d57800e2acb323bd.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the matte plastic phone box at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.404, 0.550)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0916fd629bde382d.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.345, 0.419) or (0.178, 0.520)?" }, { "from": "gpt", "value": "Positioned in front is point (0.345, 0.419)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9cecfa1d04a7c5d7.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of black plastic wheelchair at left in the image." }, { "from": "gpt", "value": "[(0.447, 0.675)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d994632851c09cc4.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at point 0.0, 0.0 in the park. You want to take a photo of the bronze statue at center. Which direction should you walk to get closer to it?" }, { "from": "gpt", "value": "You should walk towards the northeast direction to reach the bronze statue at center located at point (0.485, 0.180)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3610719936b7daed.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer in the front row of the wrestling match. You want to take a closeup shot of the black matte shirt at center. Based on its position, which direction should you move to get it centered in your viewfinder?" }, { "from": "gpt", "value": "The black matte shirt at center is located at point (0.688, 0.528). To center it in your viewfinder, you should move slightly to the right and up since the coordinates are offset from the center of the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/65ea6c6453bc60a5.jpg", "conversations": [ { "from": "human", "value": "\nLocate dark gray sweater at center in the image." }, { "from": "gpt", "value": "[(0.750, 0.606)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c669de0d8d65cd1d.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.320, 0.123) or point (0.756, 0.377)?" }, { "from": "gpt", "value": "Positioned behind is point (0.320, 0.123)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf0eb82438607f0c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, smooth bark tree at center or green bark tree at left, stands taller?" }, { "from": "gpt", "value": "With more height is green bark tree at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8f3c53204d56accc.jpg", "conversations": [ { "from": "human", "value": "\nDoes checkered fabric shirt at center have a larger size compared to translucent glass beer at center?" }, { "from": "gpt", "value": "Indeed, checkered fabric shirt at center has a larger size compared to translucent glass beer at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eba5b1accc074340.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, gray knitted glove at center or black plastic tablet at upper center?" }, { "from": "gpt", "value": "black plastic tablet at upper center is above." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e40eb68aec608d0.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, matte white window frame at center or brown textured plant at center?" }, { "from": "gpt", "value": "brown textured plant at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/924569019648569f.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.261, 0.664)?" }, { "from": "gpt", "value": "black matte/soft fabric at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f48fd6ed6101b23.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green fabric table at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.841, 0.914)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29c2b0571cdc14df.jpg", "conversations": [ { "from": "human", "value": "\nBetween matte glass window at right and crumbly brown bread at lower center, which one has more height?" }, { "from": "gpt", "value": "matte glass window at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bb687f57053e302a.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the glossy plastic box at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.502, 0.289)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b8f21736b292bb4.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up a shot of the two children in the scene. You need to position a small stool between the beige soft coat at center and the black matte jacket at center so that it doesn" }, { "from": "gpt", "value": "The beige soft coat at center has a lesser height compared to black matte jacket at center, so the stool should be placed closer to the beige soft coat at center to ensure both children can comfortably reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/adc482f7cf16ab4c.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.591, 0.702) in front of point (0.346, 0.828)?" }, { "from": "gpt", "value": "No, it is behind (0.346, 0.828)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca781c76e704b44b.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the crowd at the protest. There is a point at coordinate (0.250, 0.608). How far is that point from you?" }, { "from": "gpt", "value": "The point at coordinate (0.250, 0.608) is 22.65 feet away from you." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4bfc156886ad7fe4.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.828, 0.800) positioned after point (0.379, 0.283)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a0825ac8d79f135.jpg", "conversations": [ { "from": "human", "value": "\nDoes plaid fabric hat at upper center appear under white soft lamb at center?" }, { "from": "gpt", "value": "No, plaid fabric hat at upper center is not below white soft lamb at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b256bc2b19dded74.jpg", "conversations": [ { "from": "human", "value": "\nBetween green grassy at center and clear water at center, which one has more height?" }, { "from": "gpt", "value": "clear water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/334f622348df8e15.jpg", "conversations": [ { "from": "human", "value": "\nYou are a customer comparing two LG Optimus One smartphones displayed in a store. You see the matte black phone at center and the metallic blue phone at center. Which one do you think is larger?" }, { "from": "gpt", "value": "The matte black phone at center is bigger than the metallic blue phone at center, so the matte black phone at center is larger." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4cd80dd2db24b6d4.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.640, 0.544) closer to viewer compared to point (0.659, 0.581)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4a37a607f0463d7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black matte gas stove at left is thinner than smooth yellowish bowl at right?" }, { "from": "gpt", "value": "Incorrect, black matte gas stove at left's width is not less than smooth yellowish bowl at right's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/219aaebbf74c0129.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the black glossy car at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.906, 0.920)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/efdcb2fc53bcca6f.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of snowy granite mountain range at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.531, 0.511)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e1c5421bfbc079e.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer adjusting the camera settings. The black glossy sunglasses at center are positioned at coordinates 0.728 on the x and 0.718 on the y. If the camera focuses on the nose and upper lip, which are at the center of the image, will the sunglasses be in focus?" }, { "from": "gpt", "value": "The black glossy sunglasses at center are located at point (0.718, 0.728), which is slightly off the exact center of the image. Since the camera focuses on the nose and upper lip at the center, the sunglasses may not be fully in focus, especially given the shallow depth of field mentioned in the scene description." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/39198eca31ffa284.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.218, 0.734) or point (0.836, 0.758)?" }, { "from": "gpt", "value": "Point (0.836, 0.758) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/052a9d8f7633b365.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the white picket fence at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.427, 0.906)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec037cdccbced51c.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of maroon hoodie at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.787, 0.686)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3f7c1bbe6b29f80a.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a metallic street sign at center-right. Pinpoint a point to the metallic street sign at center-right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.852, 0.664)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/40a61074ecdffc66.jpg", "conversations": [ { "from": "human", "value": "\nLocate the stone tower at right in the image." }, { "from": "gpt", "value": "[(0.845, 0.472)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce2b99ca4dbfd657.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of gray wool sweater vest at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.351, 0.706)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7249e2558bf3e90b.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.685, 0.717) and point (0.416, 0.470), which one is positioned in front?" }, { "from": "gpt", "value": "Positioned in front is point (0.416, 0.470)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d7dfb3ff01d79f8d.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of green leafy tree at upper left in the image." }, { "from": "gpt", "value": "[(0.232, 0.080)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ee091cb3fb03ee5.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.438, 0.758)?" }, { "from": "gpt", "value": "white matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1639a331fca9c853.jpg", "conversations": [ { "from": "human", "value": "\nBetween shiny black rooster at center and black and white feathers at center, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "From the viewer's perspective, black and white feathers at center appears more on the right side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/474be7dcb750c0a6.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any clear blue water at center in the image." }, { "from": "gpt", "value": "[(0.500, 0.753)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02a92f4632e54866.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the concert. You want to capture a clear photo of both the purple matte shirt at center and the shiny blue jacket at center. Which one should you focus on to ensure both are in focus?" }, { "from": "gpt", "value": "To ensure both the purple matte shirt at center and the shiny blue jacket at center are in focus, you should focus on the purple matte shirt at center since it is in front of the shiny blue jacket at center, allowing the depth of field to cover both objects." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77292f670744930a.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.366, 0.469) from camera?" }, { "from": "gpt", "value": "Point (0.366, 0.469) is 46.76 centimeters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c15811b4198aecaa.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at a certain distance from the gray textured cat at center. You want to take a closeup photo of it. Do you need to move closer or farther away?" }, { "from": "gpt", "value": "The gray textured cat at center is 1.27 meters away from camera. To take a closeup photo, you need to move closer to reduce the distance between the camera and the cat." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d7fc260ec44347f.jpg", "conversations": [ { "from": "human", "value": "\nYou are a sports analyst watching the game. You notice a point marked at coordinates (0.295, 0.047) on the field. Based on the scene, what object is located at that point?" }, { "from": "gpt", "value": "The point at coordinates (0.295, 0.047) marks the location of the dark blue jersey at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7f002be842d1fae8.jpg", "conversations": [ { "from": "human", "value": "\nIs clear water at center to the right of metallic gray bridge at center from the viewer's perspective?" }, { "from": "gpt", "value": "In fact, clear water at center is to the left of metallic gray bridge at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/10a448b560172b02.jpg", "conversations": [ { "from": "human", "value": "\nYou are attending a council anniversary event and see the blue fabric at center and the gray suit at center. Which one is positioned lower in the image?" }, { "from": "gpt", "value": "The blue fabric at center is below gray suit at center, so the blue fabric at center is positioned lower in the image." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/09a7532a9dce9603.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between yellow-black dragonfly at center and camera?" }, { "from": "gpt", "value": "The distance of yellow-black dragonfly at center from camera is 4.89 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3db1a151186a0e99.jpg", "conversations": [ { "from": "human", "value": "\nLocate all shiny orange plush bear at center in the image." }, { "from": "gpt", "value": "[(0.552, 0.506)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/add88bfd13f0d813.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if transparent wireframe cylinder at center is shorter than green matte nail polish at upper right?" }, { "from": "gpt", "value": "Incorrect, transparent wireframe cylinder at center's height does not fall short of green matte nail polish at upper right's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b2e40ddf2d11678c.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at left have a greater width compared to dark gray stone spire at center?" }, { "from": "gpt", "value": "Yes, green leafy tree at left is wider than dark gray stone spire at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d67a40d0959235f2.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.294, 0.658) or (0.642, 0.616)?" }, { "from": "gpt", "value": "Point (0.294, 0.658) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a1a305077a312c9e.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.885, 0.762) or point (0.436, 0.542)?" }, { "from": "gpt", "value": "Positioned in front is point (0.885, 0.762)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/700ccf0be4639fe8.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of green grassy hillside at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.518, 0.867)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4409e6e79cf91158.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between point (0.687, 0.614) and camera." }, { "from": "gpt", "value": "Point (0.687, 0.614) and camera are 6.63 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/99c2767f3e66d910.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between red satin tablecloth at center and matte gold lampshade at right." }, { "from": "gpt", "value": "red satin tablecloth at center is 19.89 inches away from matte gold lampshade at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a2ad796e482c228.jpg", "conversations": [ { "from": "human", "value": "\nYou are an interior designer analyzing the placement of objects in the image. The matte gray suit at left is positioned at a specific coordinate. Can you determine its exact coordinates?" }, { "from": "gpt", "value": "The matte gray suit at left is located at the coordinates point (0.292, 0.648)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9fc375431da5e32a.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth silk tie at right wider than smooth fabric tie at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/21607430d1a7cf85.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the transparent glass sphere at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.481, 0.495)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c80db3d22646d383.jpg", "conversations": [ { "from": "human", "value": "\nBetween shiny sand at lower center and silhouette shorts at center, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "shiny sand at lower center is more to the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ba0dbc88f47be4f.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of translucent plastic dressing bottle at upper right? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.825, 0.327)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9dd37202d29733e3.jpg", "conversations": [ { "from": "human", "value": "\nLocate all green leafy palm tree at upper right in the image." }, { "from": "gpt", "value": "[(0.868, 0.166)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/63e208e0c41aa17e.jpg", "conversations": [ { "from": "human", "value": "\nYou are a traveler at the transportation hub and see a gray cotton shirt at lower left and a striped shirt at center. Which shirt is taller?" }, { "from": "gpt", "value": "The gray cotton shirt at lower left is taller than striped shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cb417ffbae6fe9d2.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of a white matte trailer truck at center. You want to walk to the building in the background. How far is the building from you?" }, { "from": "gpt", "value": "The distance between the white matte trailer truck at center and the viewer is 5.91 meters. However, the exact distance to the building in the background is not provided in the scene description." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b3e871254d25ee49.jpg", "conversations": [ { "from": "human", "value": "\nYou are a guest in this living room and want to sit closer to the heat source. Which object should you move towards, the metallic fireplace at center or the black fur cat at lower right?" }, { "from": "gpt", "value": "The metallic fireplace at center is larger than the black fur cat at lower right, so you should move towards the metallic fireplace at center to get closer to the heat source." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5aa98ac50a7690fa.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of matte black shirt at left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.122, 0.561)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/626bc6fd804b0219.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.540, 0.748)?" }, { "from": "gpt", "value": "yellow matte soap at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34a0a073e8f8035b.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, smooth concrete pavement at center or brown rough textured tortoise at left?" }, { "from": "gpt", "value": "From the viewer's perspective, smooth concrete pavement at center appears more on the right side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/48ef951d1a928568.jpg", "conversations": [ { "from": "human", "value": "\nYou are a city planner reviewing this urban layout. You need to determine the spatial relationship between the white glass skyscraper at left and the smooth glass skyscraper at center. Which one is positioned lower in the aerial view?" }, { "from": "gpt", "value": "The white glass skyscraper at left is located below the smooth glass skyscraper at center, so it is positioned lower in the aerial view." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8ed3cab053c0ec32.jpg", "conversations": [ { "from": "human", "value": "\nYou are a security guard in the lab and need to check both the black pinstripe suit at left and the black plastic laptop at lower right. Which object should you check first based on their positions?" }, { "from": "gpt", "value": "The black pinstripe suit at left should be checked first because it is closer to the security guard than the black plastic laptop at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6764bd04d8e5520.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, clear water at lower left or dark brown skin at lower center?" }, { "from": "gpt", "value": "dark brown skin at lower center is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b90a522843326b8.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of white striped shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.745, 0.616)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/79d8d159ce12e36b.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.588, 0.366) or point (0.724, 0.338)?" }, { "from": "gpt", "value": "Point (0.588, 0.366) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/931445e0fb78221e.jpg", "conversations": [ { "from": "human", "value": "\nBetween knitted wool hat at center and matte red knit hat at center, which one has less height?" }, { "from": "gpt", "value": "matte red knit hat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f55da93d9ffa9e70.jpg", "conversations": [ { "from": "human", "value": "\nDoes white striped polo shirt at center have a smaller size compared to gold-framed picture at upper center?" }, { "from": "gpt", "value": "Incorrect, white striped polo shirt at center is not smaller in size than gold-framed picture at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/41c428692eedceeb.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.619, 0.395) positioned behind point (0.001, 0.770)?" }, { "from": "gpt", "value": "Yes, it is behind point (0.001, 0.770)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7076f222d3873ef8.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the payphone booth and want to reach the two points marked in the image. Which point, point (0.521, 0.778) or point (0.487, 0.425), is closer to you?" }, { "from": "gpt", "value": "Point (0.521, 0.778) is in front of point (0.487, 0.425), so it is closer to you." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/398998a3de9986af.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker who just arrived at the trailhead and see the green matte bicycle at left leaning against the path. If you want to reach the bicycle, how far do you have to walk from your current position?" }, { "from": "gpt", "value": "The green matte bicycle at left is 14.71 meters away from your current position, so you need to walk that distance to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/87a26b23424a7cca.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer positioned at the edge of the pool in the dolphinarium. You want to capture a photo of the dark hair at center and the dark brown leather jacket at lower left in the same frame. Based on their sizes, can you fit both subjects into your camera viewfinder without zooming in?" }, { "from": "gpt", "value": "The dark hair at center might be wider than dark brown leather jacket at lower left, so there is a possibility that both can fit into the camera viewfinder without zooming in, but it depends on their actual widths." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/68b53748ed1b2900.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.791, 0.602) positioned in front of point (0.106, 0.408)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.106, 0.408)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/538702f2400355d0.jpg", "conversations": [ { "from": "human", "value": "\nBetween black cotton shirt at right and green fabric shirt at center, which one is positioned lower?" }, { "from": "gpt", "value": "green fabric shirt at center is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c077609768689f05.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black shipping container at center is wider than matte black shipping container at right?" }, { "from": "gpt", "value": "In fact, matte black shipping container at center might be narrower than matte black shipping container at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f4bf3478a8c9ad4.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black cape at center to the right of denim jacket at lower left from the viewer's perspective?" }, { "from": "gpt", "value": "Correct, you'll find matte black cape at center to the right of denim jacket at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4070d0958fe7b97a.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of dark blue sweater at center less distant than that of maroon sleeveless top at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/12ec6775d0ad6729.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, clear glass window at upper left or white glossy counter top at center?" }, { "from": "gpt", "value": "Positioned higher is clear glass window at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c818aab3293ab632.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance from yellow matte jacket at lower left to yellow matte shirt at center." }, { "from": "gpt", "value": "yellow matte jacket at lower left is 39.00 feet away from yellow matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f108d826322b1b20.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of gray wool sweater at left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.166, 0.584)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6a2c35d801062e5d.jpg", "conversations": [ { "from": "human", "value": "\nYou are a crane operator trying to lower the white plastic boat at center into the clear water at boat right. What is the minimum distance you need to lower the boat to ensure it reaches the water?" }, { "from": "gpt", "value": "The white plastic boat at center is 27.52 meters from the clear water at boat right, so you need to lower it at least 27.52 meters to ensure it reaches the water." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/27c67177c50fdd85.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.055, 0.886)?" }, { "from": "gpt", "value": "yellow-green jersey at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7bb0eb7f9926307.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between rustic clay cliff at center and camera?" }, { "from": "gpt", "value": "rustic clay cliff at center is 53.52 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed00bd6591ccc403.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the edge of the water in the image. If you want to walk to the wooden statue at center, which direction should you head towards?" }, { "from": "gpt", "value": "The wooden statue at center is located at point 0.683 on the x axis and 0.502 on the y axis. Since you are at the edge of the water, you should walk towards the direction of the statue which is in the center of the image." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/93ff0e7d61f0e3ab.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown matte tree at center is positioned to the right of brown textured bush at right?" }, { "from": "gpt", "value": "Indeed, brown matte tree at center is positioned on the right side of brown textured bush at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e6e535a6360ce107.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the dark gray fabric shirt at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.413, 0.805)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8f5bfbc086960dfd.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the room and want to locate the point at coordinates (0.488, 0.455). Based on the scene description, where would this point be located relative to the wooden frame window at upper center?" }, { "from": "gpt", "value": "The point at coordinates (0.488, 0.455) is located on the wooden frame window at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a7b53a2c0545e17.jpg", "conversations": [ { "from": "human", "value": "\nHow close is point (0.620, 0.461) from camera?" }, { "from": "gpt", "value": "Point (0.620, 0.461) and camera are 12.16 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/209ccbe15dea1d00.jpg", "conversations": [ { "from": "human", "value": "\nDoes black asphalt highway at center appear on the left side of metallic blue trailer truck at center?" }, { "from": "gpt", "value": "In fact, black asphalt highway at center is to the right of metallic blue trailer truck at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b822706c32e41c45.jpg", "conversations": [ { "from": "human", "value": "\nYou are a waiter carrying a tray of drinks and need to move from the golden glass carlsberg at left to the white marble table at center. Given that your tray is 1.2 meters wide, can you safely navigate the space between them without spilling the drinks?" }, { "from": "gpt", "value": "The distance between the golden glass carlsberg at left and the white marble table at center is 2.82 meters. Since your tray is only 1.2 meters wide, there is sufficient space to navigate safely between them without any obstruction." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea8b48b224e171af.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing behind the black fence. You want to capture a clear photo of the blue matte soccer jersey at center without the green grass at center blocking the view. Is this possible given their positions?" }, { "from": "gpt", "value": "The green grass at center is in front of the blue matte soccer jersey at center, so it will block the view. You need to adjust your angle or move closer to ensure the jersey is visible without obstruction." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cac58601dd8d8177.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of brown stone at lower center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.326, 0.869)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/93fe69d2fa26d258.jpg", "conversations": [ { "from": "human", "value": "\nLocate shiny red dress at center in the image." }, { "from": "gpt", "value": "[(0.289, 0.769)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6a7a905e17a7fe54.jpg", "conversations": [ { "from": "human", "value": "\nHow close is point (0.578, 0.933) from camera?" }, { "from": "gpt", "value": "Point (0.578, 0.933) is 1.24 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3487e1a0b703f36e.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.332, 0.833) come farther from viewer compared to point (0.091, 0.559)?" }, { "from": "gpt", "value": "No, (0.332, 0.833) is in front of (0.091, 0.559)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/005241bcf968699f.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the edge of a stone plaza and see a person in denim at center taking a photo. If you want to approach them without being in their frame, how far should you stay behind?" }, { "from": "gpt", "value": "The denim at center and viewer are 3.20 meters apart, so to avoid being in their frame, you should stay at least 3.20 meters behind the denim at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc863ef8ec55daa5.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the shiny red mesh shoe at center and the white soft sock at center. Which object should you focus on first if you want to ensure both are in sharp focus?" }, { "from": "gpt", "value": "The shiny red mesh shoe at center is located below the white soft sock at center. To ensure both are in sharp focus, you should focus on the white soft sock at center first since it is farther away from the camera, allowing the depth of field to cover the closer shiny red mesh shoe at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f4fa42c6f03165e.jpg", "conversations": [ { "from": "human", "value": "\nYou are a referee watching the basketball game. You notice the white matte shirt at right and the glossy rubber basketball at upper center. Which object is closer to the front of the scene?" }, { "from": "gpt", "value": "The white matte shirt at right is closer to the front of the scene because the glossy rubber basketball at upper center is behind it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f22b60e90759b76.jpg", "conversations": [ { "from": "human", "value": "\nBetween brown rough tree at center and brown brick barn at center, which one has less height?" }, { "from": "gpt", "value": "Standing shorter between the two is brown brick barn at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d5f9aa1fe48e9f90.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the center of the image and want to take a photo of the white stone clock tower at upper left. In which direction should you point your camera?" }, { "from": "gpt", "value": "The white stone clock tower at upper left is located at point (0.182, 0.228), so you should point your camera to the upper left direction to capture it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9477dfb44924f0e9.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of yellowmaterial/textureparking sign at center in the image." }, { "from": "gpt", "value": "[(0.592, 0.839)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4a0bfa7ca271944.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the green striped sari at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.553, 0.414)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/61040ea4bec88347.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, black matte camera at left or jeans at center?" }, { "from": "gpt", "value": "black matte camera at left is below." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8740c53f3e3028cc.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a closeup of the smooth plastic bottle at left without the smooth black blouse at center blocking it. Can you move the bottle to the right to avoid the blouse?" }, { "from": "gpt", "value": "The smooth black blouse at center is positioned over the smooth plastic bottle at left, so moving the bottle to the right would help avoid the blouse blocking it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5be53f2a95b4097b.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the white matte guitar at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.493, 0.452)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b528b838e21f37e.jpg", "conversations": [ { "from": "human", "value": "\nYou are a golfer standing on the gray gravel path at left and want to hit the ball into the transparent plastic hole at center. Which direction should you aim to reach the hole?" }, { "from": "gpt", "value": "The gray gravel path at left is closer to the viewer than the transparent plastic hole at center, so you should aim forward towards the transparent plastic hole at center to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/072ec80583cb15b4.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.429, 0.347) less distant than point (0.319, 0.519)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46a188afd2ffe723.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of silver metallic pole at left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.301, 0.502)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b121540f9c07a37b.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.538, 0.530)?" }, { "from": "gpt", "value": "matte white jumpsuit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7d99fa570f536e7.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.727, 0.642) or point (0.699, 0.216)?" }, { "from": "gpt", "value": "Point (0.727, 0.642) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c62e7d0703b6636b.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, brown glass beer bottle at center or wooden coaster at center?" }, { "from": "gpt", "value": "With more height is brown glass beer bottle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aca7f42ac35e16b3.jpg", "conversations": [ { "from": "human", "value": "\nIs brown crispy shrimp at center further to the viewer compared to shiny brown nuts at center?" }, { "from": "gpt", "value": "No, it is in front of shiny brown nuts at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f519100c89d77d87.jpg", "conversations": [ { "from": "human", "value": "\nWhere is black pinstripe suit at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.307, 0.528)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/21c75821c91cf866.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.088, 0.517) less distant than point (0.024, 0.517)?" }, { "from": "gpt", "value": "Yes, point (0.088, 0.517) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6bf629762fd155f6.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.850, 0.333) farther from camera compared to point (0.884, 0.128)?" }, { "from": "gpt", "value": "No, (0.850, 0.333) is in front of (0.884, 0.128)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f9de48ce515926b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if clear glass window at center is bigger than dark blue denim jeans at lower left?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aba02e9aedb22a27.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.368, 0.469) or (0.353, 0.352)?" }, { "from": "gpt", "value": "Point (0.368, 0.469)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2cc748c0015723cf.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the left, matte blue car at upper left or shiny blue car at lower left?" }, { "from": "gpt", "value": "matte blue car at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6148305563c07005.jpg", "conversations": [ { "from": "human", "value": "\nIs green fabric umbrella at left below green fabric umbrella at center?" }, { "from": "gpt", "value": "Yes, green fabric umbrella at left is below green fabric umbrella at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1eea0a5368313123.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte blue t-shirt at center come behind matte balloons at upper left?" }, { "from": "gpt", "value": "No, matte blue t-shirt at center is in front of matte balloons at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/001ddffdc17b24e4.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up for a group photo. You need to ensure there is enough space between the matte black jacket at center and the white matte table at center for your camera equipment. The equipment requires a minimum of 50 centimeters of space. Based on the scene, can you fit your equipment between them?" }, { "from": "gpt", "value": "The distance between the matte black jacket at center and the white matte table at center is 47.99 centimeters, which is less than the required 50 centimeters. Therefore, the equipment cannot fit between them." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/724f6855b0e38b18.jpg", "conversations": [ { "from": "human", "value": "\nYou are a stagehand who needs to move the wooden drum at center and the shiny metallic microphone at upper left to the storage room. Based on their sizes, which one should you carry first to ensure you can fit both items through the narrow doorway?" }, { "from": "gpt", "value": "The wooden drum at center is larger than the shiny metallic microphone at upper left, so you should carry the shiny metallic microphone at upper left first to ensure both items can fit through the narrow doorway." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/780669ad184fdb58.jpg", "conversations": [ { "from": "human", "value": "\nBetween blue lace dress at center and wooden table at center, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "From the viewer's perspective, wooden table at center appears more on the right side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7dce7d9ba646604f.jpg", "conversations": [ { "from": "human", "value": "\nIs brown fur scarf at center taller than black fleece at right?" }, { "from": "gpt", "value": "In fact, brown fur scarf at center may be shorter than black fleece at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ed0ef873d160ddd.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.423, 0.330) come farther from viewer compared to point (0.584, 0.753)?" }, { "from": "gpt", "value": "No, it is in front of (0.584, 0.753)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e106b11f54be46e.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of dark gray suit at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.513, 0.686)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c8d157563bcfe482.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a blue plastic swing at lower left. Pinpoint a point to the blue plastic swing at lower left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.077, 0.797)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ffc1b1917db30fc.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the beach and want to take a photo of the white sailboat at center. Where should you aim your camera to capture it?" }, { "from": "gpt", "value": "You should aim your camera at point (0.338, 0.562) to capture the white sailboat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44247baa790ac2d8.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the worn leather slipper at lower right and the worn leather shoe at lower left in a composition. Which object is located to the right of the other?" }, { "from": "gpt", "value": "The worn leather slipper at lower right is positioned on the right side of worn leather shoe at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bdff363095e6c90f.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked as point (0.502, 0.452) in the image. How far are you from the viewer?" }, { "from": "gpt", "value": "The distance of point (0.502, 0.452) from viewer is 6.13 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d8fa4c106b8e5da8.jpg", "conversations": [ { "from": "human", "value": "\nIs brick church at center smaller than gray concrete tower at upper right?" }, { "from": "gpt", "value": "Actually, brick church at center might be larger than gray concrete tower at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b16005712ece2230.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between black wood porch at center and black matte chair at lower left." }, { "from": "gpt", "value": "The distance of black wood porch at center from black matte chair at lower left is 26.96 centimeters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e31ab5315f06dbb1.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.591, 0.681) or point (0.383, 0.286)?" }, { "from": "gpt", "value": "The point (0.383, 0.286) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/25c8326e05345a68.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the dock and want to get to the red wooden hut at center. Which direction should you move to avoid the muddy water at lower center?" }, { "from": "gpt", "value": "Since the muddy water at lower center is below the red wooden hut at center, you should move upward towards the red wooden hut at center to avoid stepping into the muddy water at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/53db24a9e846a6dc.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte shorts at lower left wider than green fabric jacket at center?" }, { "from": "gpt", "value": "Indeed, black matte shorts at lower left has a greater width compared to green fabric jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d363206b48848fd1.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up for a group photo in the office. You notice the denim jacket at lower right and the metallic silver frame at center. Which object should you adjust your camera focus to first if you want to capture both objects clearly in the same shot?" }, { "from": "gpt", "value": "The denim jacket at lower right is larger in size than the metallic silver frame at center, so you should focus on the denim jacket at lower right first to ensure its details are sharp before adjusting for the smaller metallic silver frame at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a27c78ba8764da20.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from green grass at lower center to camera." }, { "from": "gpt", "value": "6.48 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5356808226c4f9a8.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the beige sweater at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.568, 0.706)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58a97c675fbf507f.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of black mesh office chair at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.278, 0.662)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1bef6d24f1f3687.jpg", "conversations": [ { "from": "human", "value": "\nDoes orange matte shirt at center have a smaller size compared to blue fabric wheelchair at left?" }, { "from": "gpt", "value": "Correct, orange matte shirt at center occupies less space than blue fabric wheelchair at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/908fbd11801dbe69.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at point (0.431, 0.616) on the train station platform. You want to walk to point (0.570, 0.714). According to the scene description, which direction should you face to move towards your destination?" }, { "from": "gpt", "value": "You should face forward because point (0.570, 0.714) is in front of point (0.431, 0.616)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5eab8497364d3f7e.jpg", "conversations": [ { "from": "human", "value": "\nDoes purple scarf at upper right appear over camouflage pants at left?" }, { "from": "gpt", "value": "Indeed, purple scarf at upper right is positioned over camouflage pants at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8820c1496d974144.jpg", "conversations": [ { "from": "human", "value": "\nIs printed cotton shirt at center taller than white striped polo shirt at center?" }, { "from": "gpt", "value": "Incorrect, printed cotton shirt at center's height is not larger of white striped polo shirt at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e72c7b9d0a80960.jpg", "conversations": [ { "from": "human", "value": "\nYou are an astronomer observing the sky and the landscape. You notice the purple matte cloud at upper center and the rusty stone rock at left. Which object is closer to your line of sight?" }, { "from": "gpt", "value": "The purple matte cloud at upper center is closer to your line of sight because it is further to the viewer than the rusty stone rock at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd16257b0304ccf3.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.151, 0.512) and camera?" }, { "from": "gpt", "value": "Point (0.151, 0.512) and camera are 7.87 feet apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b04420863615d287.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green camouflage shirt at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.792, 0.475)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0650ebc703d371c.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of brown wood railing at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.203, 0.603)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ae110884e0736d5.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black fabric table at center is taller than dark gray fabric chair at center?" }, { "from": "gpt", "value": "Indeed, black fabric table at center has a greater height compared to dark gray fabric chair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/229639e32e1a62e4.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of the museum, and you see a point marked at coordinates point (0.982, 0.019). How far is that point from you?" }, { "from": "gpt", "value": "The point (0.982, 0.019) is 5.91 meters away from the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7feef0d54337866.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.055, 0.697) and camera?" }, { "from": "gpt", "value": "Point (0.055, 0.697) is 696.29 feet away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c0d90ad2a0ddc16.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.509, 0.444) or point (0.177, 0.731)?" }, { "from": "gpt", "value": "Point (0.177, 0.731) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/adf4c9fbb8f6ef0a.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the white glossy water at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.518, 0.597)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ad02a32121b76d48.jpg", "conversations": [ { "from": "human", "value": "\nYou are a pedestrian standing at the edge of the square. You notice the bare branches at left and the dark blue jacket at center. Which object appears wider from your perspective?" }, { "from": "gpt", "value": "The bare branches at left appears wider than the dark blue jacket at center according to the description." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0b27ac610db6c0e.jpg", "conversations": [ { "from": "human", "value": "\nYou are an interior designer assessing the lighting in a room. You notice the clear glass window at upper center and the matte glass window at upper right. Which window is positioned higher in the room?" }, { "from": "gpt", "value": "The clear glass window at upper center is positioned higher in the room as it is located above the matte glass window at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78e0f6e6248a6c2d.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, matte black suit at left or red striped tie at left?" }, { "from": "gpt", "value": "matte black suit at left is higher up." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dfc7339c4f4dcdda.jpg", "conversations": [ { "from": "human", "value": "\nYou are a passenger sitting in the vintage train car and want to enjoy the view outside. Which of the two clear glass windows, the clear glass window at left or the clear glass window at center right, offers a wider field of view?" }, { "from": "gpt", "value": "The clear glass window at left has a larger size compared to the clear glass window at center right, so it offers a wider field of view." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d364fa38078e141f.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of black leather jacket at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.386, 0.416)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73c193dad31b9a5e.jpg", "conversations": [ { "from": "human", "value": "\nIs greenish water at center thinner than rusty metal rail at lower left?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d188dbd80cdd49c1.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.217, 0.948) and point (0.395, 0.562), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.395, 0.562) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc72dfb7b601f2ae.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between point (0.967, 0.830) and camera?" }, { "from": "gpt", "value": "59.18 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eefc9f27e8c0629a.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of dark gray feathers at center less distant than that of light pink fabric at upper right?" }, { "from": "gpt", "value": "No, dark gray feathers at center is behind light pink fabric at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7abe6c98f0010718.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of dark brown hair at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.673, 0.444)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb36a4132fd95f04.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.457, 0.809) lie behind point (0.227, 0.564)?" }, { "from": "gpt", "value": "No, it is in front of (0.227, 0.564)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/418444bf508c169a.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from green leafy tree at upper center to camera." }, { "from": "gpt", "value": "green leafy tree at upper center is 8.98 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a46bc127234067a8.jpg", "conversations": [ { "from": "human", "value": "\nBetween matte yellow helmet at left and green glass bottle at center, which one is positioned higher?" }, { "from": "gpt", "value": "matte yellow helmet at left is higher up." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/18744ea9b9183726.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person carrying a box that is 1.5 meters tall. You need to walk through the path between the gray asphalt sidewalk at center and the plaid shirt at center. Can the box fit through the path?" }, { "from": "gpt", "value": "The gray asphalt sidewalk at center has a lesser height compared to plaid shirt at center, so the path between them is at least as tall as the plaid shirt at center. Since the box is 1.5 meters tall, it may not fit if the plaid shirt at center is taller than 1.5 meters. However, without knowing the exact height of the plaid shirt at center, it is impossible to determine for certain." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d9e9ad4b0b05a0b.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance measurement between green marble dome at center and black polished statue at lower right?" }, { "from": "gpt", "value": "A distance of 62.94 meters exists between green marble dome at center and black polished statue at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8f7ecb2fc01190d2.jpg", "conversations": [ { "from": "human", "value": "\nLocate striped sweater at center in the image." }, { "from": "gpt", "value": "[(0.386, 0.556)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d5f194297cd5ed84.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.140, 0.652) farther from viewer compared to point (0.865, 0.603)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/65f9ccd5e08e18ac.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.663, 0.573) or point (0.121, 0.463)?" }, { "from": "gpt", "value": "Point (0.663, 0.573) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1835e5fbca05cee.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.566, 0.170) lie in front of point (0.351, 0.620)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1987d940f518cc8.jpg", "conversations": [ { "from": "human", "value": "\nWhat is at (0.557, 0.750)?" }, { "from": "gpt", "value": "brown cardboard box at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00f7417f638ff1f5.jpg", "conversations": [ { "from": "human", "value": "\nBetween shiny metallic bicycle at center and blue fabric shorts at lower left, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "shiny metallic bicycle at center is more to the right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6947e0f2c5e4e1c2.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.487, 0.845) positioned behind point (0.740, 0.836)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9c79f4d1ca4de10.jpg", "conversations": [ { "from": "human", "value": "\nYou are a fashion designer observing a mannequin in a store window displaying clothing items. The mannequin is wearing the beige fabric pants at center and the red matte jacket at center. Which clothing item is taller on the mannequin?" }, { "from": "gpt", "value": "The beige fabric pants at center has a greater height compared to the red matte jacket at center, so the beige fabric pants at center is taller on the mannequin." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/98b5d50bb9c61b5c.jpg", "conversations": [ { "from": "human", "value": "\nWhere is brown grass at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.498, 0.181)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7f9df2136af3971.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person trying to navigate through the pedestrian walkway. The brick pavement at center is where you need to walk. Considering the height of the brown textured tree at center, will the tree obstruct your path?" }, { "from": "gpt", "value": "The brick pavement at center is not as tall as brown textured tree at center, so the tree will not obstruct your path since it is taller than the pavement." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7509141ea260e31.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a leopard print dress at center. Pinpoint a point to the leopard print dress at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.625, 0.611)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d76dd24b86fcd9bc.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.737, 0.072) and point (0.713, 0.366), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.713, 0.366) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3e072f91220c3481.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the right, cloudy sky at upper center or green matte roof at center?" }, { "from": "gpt", "value": "cloudy sky at upper center is more to the right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/35f12667a0c2d9f5.jpg", "conversations": [ { "from": "human", "value": "\nHow far is matte orange paper crown at center from camera?" }, { "from": "gpt", "value": "A distance of 6.09 feet exists between matte orange paper crown at center and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d233d8a01d4c82d1.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the middle of the scene and want to hand a drink to both the person wearing the white cotton shirt at center and the one wearing the yellow fabric sandal at lower left. Which person should you approach first based on their distance from you?" }, { "from": "gpt", "value": "You should approach the white cotton shirt at center first because it is closer to you than the yellow fabric sandal at lower left, as the white cotton shirt at center is further to the viewer than the yellow fabric sandal at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6cc619ece3564924.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between blue water at lower center and camera." }, { "from": "gpt", "value": "blue water at lower center is 288.23 feet away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/26a0ed1c8017b769.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte yellow shirt at center is positioned to the right of dark brown fuzzy beard at center?" }, { "from": "gpt", "value": "In fact, matte yellow shirt at center is to the left of dark brown fuzzy beard at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b094f4e9a98a0f2.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the blue and yellow patterned dress at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.618, 0.630)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/015dfbc3a70d12af.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to striped sweater at center? Please provide its 2D coordinates.Where can I find striped sweater at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.712, 0.759)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88fdaddf3551385c.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.971, 0.425) from camera?" }, { "from": "gpt", "value": "Point (0.971, 0.425) is 46.06 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/439161ff56637636.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between smooth metallic pole at center and camera?" }, { "from": "gpt", "value": "The distance of smooth metallic pole at center from camera is 24.14 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/33ab2501c76ce387.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the right, brown fuzzy jacket at left or dark blue jeans at center?" }, { "from": "gpt", "value": "Positioned to the right is dark blue jeans at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a915165879e1daca.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.754, 0.516) closer to camera compared to point (0.552, 0.222)?" }, { "from": "gpt", "value": "No, (0.754, 0.516) is further to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9104e4dc806c6883.jpg", "conversations": [ { "from": "human", "value": "\nBetween matte green tank top at center and light beige striped shirt at left, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "From the viewer's perspective, light beige striped shirt at left appears more on the left side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/962a62cdacd625c4.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if bronze statue at center is taller than bronze cat at center?" }, { "from": "gpt", "value": "Yes, bronze statue at center is taller than bronze cat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70106c6a208434be.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.714, 0.537) and point (0.100, 0.395), which one is positioned behind?" }, { "from": "gpt", "value": "Positioned behind is point (0.100, 0.395)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a564992629dfc082.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.860, 0.644) closer to viewer compared to point (0.516, 0.133)?" }, { "from": "gpt", "value": "Yes, point (0.860, 0.644) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce31dc7106c1fac2.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.234, 0.661) or (0.573, 0.566)?" }, { "from": "gpt", "value": "Point (0.234, 0.661)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/715d991b967cf977.jpg", "conversations": [ { "from": "human", "value": "\nThe baby is sitting in a high chair with a green soft bib at center and a yellow matte nose at center. Which object is taller?" }, { "from": "gpt", "value": "The green soft bib at center is taller than the yellow matte nose at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5421b8d44781438.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.036, 0.294) positioned after point (0.359, 0.605)?" }, { "from": "gpt", "value": "Yes, it is behind point (0.359, 0.605)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2efcb40bf9c5b229.jpg", "conversations": [ { "from": "human", "value": "\nYou are a pedestrian standing on the sidewalk in front of the shiny black car at center. You want to take a photo of the black brick chimney at upper right without the car blocking it. What should you do?" }, { "from": "gpt", "value": "Move to the side of the shiny black car at center so that the black brick chimney at upper right is no longer blocked by the car." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d0e98acd38c6910.jpg", "conversations": [ { "from": "human", "value": "\nYou are a painter standing in front of the scene, and you need to paint the objects on the left side of the image. Which object should you paint first, the smooth concrete pillar at left or the matte black van at left, considering their widths?" }, { "from": "gpt", "value": "The smooth concrete pillar at left has a smaller width than the matte black van at left, so you should paint the matte black van at left first since it is wider and might cover more of the left side area." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ebd7482eedb54a7.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.697, 0.662) positioned behind point (0.823, 0.561)?" }, { "from": "gpt", "value": "No, (0.697, 0.662) is in front of (0.823, 0.561)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9fc030d4b4005e79.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the matte brown jacket at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.428, 0.725)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0b048a541757002.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray concrete pavement at center appear on the right side of orange metallic ladder at center?" }, { "from": "gpt", "value": "Yes, gray concrete pavement at center is to the right of orange metallic ladder at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd3afbc8a667f572.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, black matte shirt at center or porcelain vase at center?" }, { "from": "gpt", "value": "black matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b3fa211c400f76f0.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.475, 0.359) from camera?" }, { "from": "gpt", "value": "A distance of 68.66 feet exists between point (0.475, 0.359) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9542841fb7bb95d1.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance from pink fabric dress at center to matte black shirt at center." }, { "from": "gpt", "value": "pink fabric dress at center is 21.25 inches from matte black shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23efe06f28975c58.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.159, 0.444) from camera?" }, { "from": "gpt", "value": "A distance of 21.01 meters exists between point (0.159, 0.444) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e17a21e80a235d5.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white paper at center is positioned to the left of matte black helmet at upper right?" }, { "from": "gpt", "value": "Correct, you'll find white paper at center to the left of matte black helmet at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9dfaff346449211b.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the left, green fabric uniform at center or black reflective sunglasses at center?" }, { "from": "gpt", "value": "Positioned to the left is black reflective sunglasses at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4e63b53539d21c7c.jpg", "conversations": [ { "from": "human", "value": "\nPoint to green fabric uniform at right.Point to the green fabric uniform at right in the image." }, { "from": "gpt", "value": "[(0.885, 0.778)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d42cf700121ae50d.jpg", "conversations": [ { "from": "human", "value": "\nPoint to white matte uniform at center.Point to the white matte uniform at center in the image." }, { "from": "gpt", "value": "[(0.347, 0.789)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/627865d92cf85e00.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a white soft fabric dress at center. Pinpoint a point to the white soft fabric dress at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.597, 0.389)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b932fa107e9242f.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.540, 0.764) or point (0.631, 0.637)?" }, { "from": "gpt", "value": "Point (0.540, 0.764) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/09f9e809cdfbed38.jpg", "conversations": [ { "from": "human", "value": "\nThe child is pointing upwards with their right hand. Based on the scene, which object is closer to the child? The brown fabric at center or the light skin tone flesh at upper center?" }, { "from": "gpt", "value": "The light skin tone flesh at upper center is closer to the child because it is located above the brown fabric at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b603af3a4cdf3f5.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the green rocky mountain at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.317, 0.408)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46ca8da8912d4335.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.082, 0.655) more distant than point (0.941, 0.156)?" }, { "from": "gpt", "value": "No, (0.082, 0.655) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e1deca504c1d5836.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position looking at the wooden staircase leading down into the forest. There is a specific point marked at coordinates point (0.228, 0.484). How far is that point from where you are standing?" }, { "from": "gpt", "value": "The point (0.228, 0.484) is 21.51 meters away from the camera position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/455944a771bed2f5.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of striped fabric shirt at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.410, 0.661)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92ed626cb72c64b0.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, wooden stairs at center or dark brown leather jacket at lower right?" }, { "from": "gpt", "value": "With more height is wooden stairs at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/da6adf999627ff90.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.472, 0.548) or (0.053, 0.709)?" }, { "from": "gpt", "value": "Point (0.053, 0.709) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6536be284ce45149.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between dark blue suit at left and tan quilted jacket at center." }, { "from": "gpt", "value": "dark blue suit at left is 21.56 inches from tan quilted jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d97d0e73126bbacb.jpg", "conversations": [ { "from": "human", "value": "\nIs pale skin at center thinner than smooth tan snake at center?" }, { "from": "gpt", "value": "Correct, pale skin at center's width is less than smooth tan snake at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e8d32fb2a8089d7.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the wooden planks at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.454, 0.861)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/64e8b8ee4e990624.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the cliff overlooking the coast. You see the blue water at upper left and the concrete stairs at lower left. Which one appears bigger in the scene?" }, { "from": "gpt", "value": "The blue water at upper left appears bigger in the scene because it has a larger size compared to the concrete stairs at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/328a07c21031693b.jpg", "conversations": [ { "from": "human", "value": "\nBetween brown wooden rail at right and dark gray jacket at center, which one is positioned lower?" }, { "from": "gpt", "value": "brown wooden rail at right is below." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed3e8e544f8bd417.jpg", "conversations": [ { "from": "human", "value": "\nIs gray glossy horse at center to the right of white matte shirt at center from the viewer's perspective?" }, { "from": "gpt", "value": "Yes, gray glossy horse at center is to the right of white matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/289a08d8d43cb27c.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.433, 0.273) or point (0.280, 0.816)?" }, { "from": "gpt", "value": "Point (0.280, 0.816)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/09b1c3d7970ffe6b.jpg", "conversations": [ { "from": "human", "value": "\nBetween smooth orange starfish at right and orange matte starfish at left, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "orange matte starfish at left is more to the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/67bee220b55890f2.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.659, 0.414) come behind point (0.839, 0.544)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2764c8aa461694ea.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to green leafy tree at center? Please provide its 2D coordinates.Where can I find green leafy tree at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.511, 0.203)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/826f2944f930612f.jpg", "conversations": [ { "from": "human", "value": "\nDoes glossy ceramic teapot at center have a smaller size compared to glossy black countertop at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7ccf75a5778a22f.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between wooden board at center and camera." }, { "from": "gpt", "value": "A distance of 11.82 inches exists between wooden board at center and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7a42e562462decea.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.734, 0.600) or (0.561, 0.484)?" }, { "from": "gpt", "value": "Positioned in front is point (0.734, 0.600)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd62e69627bce8e5.jpg", "conversations": [ { "from": "human", "value": "\nYou are navigating a snowmobile through a snowy landscape. There are two points marked on your map at coordinates point (0.395, 0.559) and point (0.266, 0.525). Which point is closer to the front of the snowmobile?" }, { "from": "gpt", "value": "Point (0.395, 0.559) is in front of point (0.266, 0.525), so the point closer to the front of the snowmobile is point (0.395, 0.559)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c8078b81e8e2dea.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, matte pink basket at center or purple matte shirt at left, stands taller?" }, { "from": "gpt", "value": "purple matte shirt at left is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0805681cbbf9cfc3.jpg", "conversations": [ { "from": "human", "value": "\nWhere is brown textured suit at right located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.839, 0.631)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/13dfa8c6e4bddc88.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between point (0.435, 0.630) and camera." }, { "from": "gpt", "value": "Point (0.435, 0.630) and camera are 16.62 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c707cdb093f92efd.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker planning to take a photo of the matte red backpack at left and the concrete pole at right. Which object should you zoom in on to capture both in the frame without moving your camera?" }, { "from": "gpt", "value": "You should zoom in on the matte red backpack at left because the concrete pole at right is larger in size than the matte red backpack at left, so focusing on the smaller object allows both to fit in the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd52eaa2039214d8.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.962, 0.539) or (0.277, 0.548)?" }, { "from": "gpt", "value": "Positioned behind is point (0.962, 0.539)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/550c3307eb9a86be.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a candid shot of the two children in the center of the image. The denim shirt at center and the light blue fabric shirt at center are both in your frame. Which child should you focus on if you want to ensure the closest one to the camera is in sharp focus?" }, { "from": "gpt", "value": "You should focus on the denim shirt at center because it is closer to the viewer than the light blue fabric shirt at center, making it the closer child to the camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00524871590f8b4f.jpg", "conversations": [ { "from": "human", "value": "\nYou are an archaeologist measuring the distance between the white marble statue at center and the smooth stone column at center in the ancient stone structure. What is the distance between them?" }, { "from": "gpt", "value": "The distance between the white marble statue at center and the smooth stone column at center is 7.16 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b43a12f2c9e38ce9.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a blue fabric tent at center. Pinpoint a point to the blue fabric tent at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.387, 0.595)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d93b490a89b754c8.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.545, 0.773) come farther from viewer compared to point (0.188, 0.397)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/641730c7f086f7a6.jpg", "conversations": [ { "from": "human", "value": "\nWhere is red matte sign at lower center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.737, 0.848)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3883bfbfac5f21b2.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the event and want to take a photo of the black satin dress at upper left and the clear glass wine glass at lower left. Which object is positioned to the left of the other?" }, { "from": "gpt", "value": "The black satin dress at upper left is to the left of the clear glass wine glass at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c476e41186291584.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the matte gray cap at upper left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.298, 0.420)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/75963c74214764e7.jpg", "conversations": [ { "from": "human", "value": "\nCould you provide the distance between steampunk vest at center and matte white ribbon at center?" }, { "from": "gpt", "value": "steampunk vest at center and matte white ribbon at center are 16.93 inches apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/781055b49d6589fe.jpg", "conversations": [ { "from": "human", "value": "\nHow close is point (0.855, 0.631) from camera?" }, { "from": "gpt", "value": "Point (0.855, 0.631) and camera are 7.05 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/64c44dadc6e3affd.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.748, 0.370) or (0.028, 0.495)?" }, { "from": "gpt", "value": "Positioned in front is point (0.028, 0.495)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c3b829ad9fccb8de.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.810, 0.902)?" }, { "from": "gpt", "value": "dark blue jacket at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0d6c82af520b167.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.695, 0.545) positioned after point (0.147, 0.589)?" }, { "from": "gpt", "value": "Yes, point (0.695, 0.545) is farther from viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc3286a704b691e8.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the black neoprene wetsuit at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.558, 0.625)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d05b178ac26bc203.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.278, 0.320) closer to camera compared to point (0.287, 0.456)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f337d39bde99c3f9.jpg", "conversations": [ { "from": "human", "value": "\nYou are a tourist visiting the lighthouse and want to take a photo of the dark blue water at lower center and the glossy black car at lower right. Which object appears larger in the photo?" }, { "from": "gpt", "value": "The dark blue water at lower center appears larger in the photo because it is taller than the glossy black car at lower right according to the description." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7a07d64d69b7e3a6.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.489, 0.542) behind point (0.180, 0.197)?" }, { "from": "gpt", "value": "No, (0.489, 0.542) is in front of (0.180, 0.197)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/958f8fa39f0bc645.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of black matte jacket at center from camera?" }, { "from": "gpt", "value": "black matte jacket at center is 4.50 feet away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed8b5791aee9774e.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of red concrete pillar at left less distant than that of matte orange pillar at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b9a4ae9c9e2946d.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is white stone pillar at center from camera?" }, { "from": "gpt", "value": "white stone pillar at center and camera are 292.94 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b275c5f193ef362.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.452, 0.308) or point (0.508, 0.919)?" }, { "from": "gpt", "value": "The point (0.452, 0.308) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ff2bfa33e188524.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of white checkered shirt at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.207, 0.670)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/43593db4393c33af.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of green rough bark tree at right? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.938, 0.653)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db4f93703165a5e1.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of brown furry dog at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.818, 0.550)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9fc993b7095496a8.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.209, 0.648) closer to camera compared to point (0.432, 0.508)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/490aa2a997c2925a.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing outside the green corrugated metal cabin at center and want to throw a ball to your friend who is standing 5 meters away from you. Can you reach your friend with the throw?" }, { "from": "gpt", "value": "The distance between you and your friend is 5 meters, which is less than the 6.02 meters between you and the green corrugated metal cabin at center. Since the cabin is farther away than your friend, you can successfully throw the ball to your friend without the cabin obstructing the path." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2274fad1c212f948.jpg", "conversations": [ { "from": "human", "value": "\nIs translucent yellow plastic at upper center to the left of black plastic piece at lower center from the viewer's perspective?" }, { "from": "gpt", "value": "Incorrect, translucent yellow plastic at upper center is not on the left side of black plastic piece at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc69dd25a4f38418.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the black matte tank top at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.168, 0.736)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bae5f2a2c311cde3.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the matte blue building at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.518, 0.481)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9421194946c4c9c.jpg", "conversations": [ { "from": "human", "value": "\nDoes rough bark tree at center have a lesser width compared to brick paved sidewalk at lower left?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c5c4949b74c4c15.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at point (0.297, 0.420) and want to walk to point (0.835, 0.378). Which direction should you move in relation to the sofa?" }, { "from": "gpt", "value": "You should move behind the sofa to reach point (0.835, 0.378) from point (0.297, 0.420) because point (0.835, 0.378) is behind point (0.297, 0.420)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e67ce6f4aecfea33.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the distance between gray cotton shirt at center and light pink fabric at lower left?" }, { "from": "gpt", "value": "A distance of 3.63 feet exists between gray cotton shirt at center and light pink fabric at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d1a92d6522fdd7d.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.547, 0.683) closer to camera compared to point (0.071, 0.172)?" }, { "from": "gpt", "value": "Yes, point (0.547, 0.683) is in front of point (0.071, 0.172)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf045c2e5d5961f0.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.948, 0.427) or (0.925, 0.506)?" }, { "from": "gpt", "value": "Positioned in front is point (0.925, 0.506)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/002f645263e7ac99.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.713, 0.347) closer to camera compared to point (0.420, 0.623)?" }, { "from": "gpt", "value": "Yes, point (0.713, 0.347) is in front of point (0.420, 0.623)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f457799452a9e810.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.426, 0.102) closer to viewer compared to point (0.894, 0.231)?" }, { "from": "gpt", "value": "No, (0.426, 0.102) is behind (0.894, 0.231)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d87b600d0993dbf0.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, green leafy tree at upper right or green leafy tree at upper left?" }, { "from": "gpt", "value": "Positioned higher is green leafy tree at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca690831ae5c6383.jpg", "conversations": [ { "from": "human", "value": "\nYou are an explorer navigating through the tropical landscape. You see a green leafy tree at center and a green leafy palm tree at upper right. Which tree is positioned higher up in the image?" }, { "from": "gpt", "value": "The green leafy palm tree at upper right is positioned higher up in the image than the green leafy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01ec475c41116612.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.335, 0.703) or (0.171, 0.467)?" }, { "from": "gpt", "value": "The point (0.171, 0.467) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d33801752ad3b64e.jpg", "conversations": [ { "from": "human", "value": "\nBetween gray tile fireplace at center and white glass window at upper left, which one has less height?" }, { "from": "gpt", "value": "white glass window at upper left is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/68187e0ac009e483.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.691, 0.208) and point (0.845, 0.014), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.845, 0.014) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e09956473fc86d7.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the balcony and want to place a small potted plant exactly where the matte black jacket at left is located. Is this possible?" }, { "from": "gpt", "value": "Yes, since the matte black jacket at left is located at coordinates point (0.216, 0.575), you can place the potted plant there." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8675c6d2069a13a9.jpg", "conversations": [ { "from": "human", "value": "\nWhere is matte red shirt at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.467, 0.634)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/68f14a7e49a5b8c0.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the beach and see two points marked in the image. Which point, point (0.405, 0.931) or point (0.411, 0.747), is closer to you?" }, { "from": "gpt", "value": "Point (0.405, 0.931) is closer to the camera than point (0.411, 0.747)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/539c05145c78229b.jpg", "conversations": [ { "from": "human", "value": "\nWhere is the beige striped suit at center located in the image?" }, { "from": "gpt", "value": "The beige striped suit at center is located at point (0.345, 0.580) in the image." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f2d8411b4542a9c.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the black wire at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.512, 0.059)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7155d3aaa68ee4a8.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of smooth skin hand at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.847, 0.531)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f561df19e9dab314.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing a clothing donation drive and need to determine which items are suitable for adult sizes. You see two shirts in the center of the image, a striped cotton shirt at center and a blue fabric shirt at center. Which one is more likely to be an adult size?" }, { "from": "gpt", "value": "The striped cotton shirt at center has a larger size compared to the blue fabric shirt at center, so it is more likely to be an adult size." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf8c27f985f53d16.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the left, black wrought iron fence at center or wooden railing at upper center?" }, { "from": "gpt", "value": "Positioned to the left is wooden railing at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c174ee2249f64398.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the right, black pinstripe suit at left or white satin dress at center?" }, { "from": "gpt", "value": "white satin dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b11147e221803a42.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the market and want to pick up the brown woolen jacket at right. How far do you need to reach to grab it?" }, { "from": "gpt", "value": "The brown woolen jacket at right is 2.08 meters away from the viewer, so you need to reach 2.08 meters to grab it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5ff5caac005bde1e.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.182, 0.644) from camera?" }, { "from": "gpt", "value": "Point (0.182, 0.644) is 1.09 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/523b686f90c8bd83.jpg", "conversations": [ { "from": "human", "value": "\nYou are attending an outdoor event and want to find the main entrance. You see the red brick stadium at center and the white fabric canopy at lower right. Which object is closer to the main entrance based on their positions?" }, { "from": "gpt", "value": "The red brick stadium at center is positioned on the left side of white fabric canopy at lower right, so the white fabric canopy at lower right is closer to the main entrance since it is positioned to the right of the stadium." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/62a5e1822f783979.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the shiny metallic bowl at upper right? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.872, 0.223)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ae094ffb0bb663c1.jpg", "conversations": [ { "from": "human", "value": "\nYou are a tailor observing a meeting scene. You need to adjust the length of the blue striped tie at right and the maroon silk tie at center so that both have the same height. Which tie needs to be shortened?" }, { "from": "gpt", "value": "The blue striped tie at right is taller than the maroon silk tie at center, so the blue striped tie at right needs to be shortened to match the height of the maroon silk tie at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3cad712e2aac0c96.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.752, 0.258) closer to viewer compared to point (0.168, 0.211)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73a98898a5893da4.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of white corrugated metal hut at right in the image." }, { "from": "gpt", "value": "[(0.952, 0.502)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c712348b31116e7.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of white fluffy cloud at upper center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.725, 0.434)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d5633e02f1cef76f.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.639, 0.481) or point (0.865, 0.564)?" }, { "from": "gpt", "value": "Positioned in front is point (0.865, 0.564)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e20263780b92acd6.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any green grassy at center in the image." }, { "from": "gpt", "value": "[(0.552, 0.847)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b91255ab863a56f8.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, light brown cotton shirt at center or transparent plastic microphone at center?" }, { "from": "gpt", "value": "Positioned to the left is transparent plastic microphone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/408ffc4cba3160f4.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white marble railing at upper center is bigger than clear water at right?" }, { "from": "gpt", "value": "No, white marble railing at upper center is not bigger than clear water at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/547757cb784db085.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte shirt at center shorter than green wood table at center?" }, { "from": "gpt", "value": "No, white matte shirt at center is not shorter than green wood table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/64f93aa2617f9114.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is black matte singlet at left from hairy skin at center?" }, { "from": "gpt", "value": "They are 25.26 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d4b2edfbaa17a981.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the black fabric dress at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.163, 0.722)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a38ee0ba18395e3c.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between black matte t-shirt at center and white fabric shirt at center." }, { "from": "gpt", "value": "black matte t-shirt at center is 2.04 meters from white fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/006017783a8beb66.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is shiny black car at center from camera?" }, { "from": "gpt", "value": "The distance of shiny black car at center from camera is 8.22 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fa03515220eb2f0f.jpg", "conversations": [ { "from": "human", "value": "\nYou are a guest in this grand room and want to greet the person with blonde hair at lower left. Where should you walk to approach them?" }, { "from": "gpt", "value": "The blonde hair at lower left is located at point (0.233, 0.928), so you should walk towards the lower left direction to approach them." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/91e20aefa3177704.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from brown stone church at center to camera." }, { "from": "gpt", "value": "A distance of 35.78 meters exists between brown stone church at center and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b10bf6d30ba43a9.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker trying to read the trail directions on the wooden signpost at center. However, the green mossy tree at center is blocking your view. Can you move around the tree to get a better look at the signpost?" }, { "from": "gpt", "value": "The green mossy tree at center is larger in size than wooden signpost at center, so it might block your view. To get a better look at the wooden signpost at center, you should move around the tree to find an unobstructed path where the tree is no longer in front of the signpost." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/27d4b84969de7a88.jpg", "conversations": [ { "from": "human", "value": "\nLocate the floral kimono at center in the image." }, { "from": "gpt", "value": "[(0.354, 0.569)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fd72ea52554bbdeb.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of clear water at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.775, 0.584)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/187315eda9c6259c.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.964, 0.834) or (0.345, 0.422)?" }, { "from": "gpt", "value": "Point (0.964, 0.834)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a3935eedca134c31.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker who wants to take a photo of both the brown bark tree at upper left and the smooth brown tree trunk at upper left. Since you have a camera with a fixed focal length, you need to know which one is larger to ensure both fit in the frame. Which one is bigger?" }, { "from": "gpt", "value": "The brown bark tree at upper left is bigger than the smooth brown tree trunk at upper left, so you should position your camera to focus on the brown bark tree at upper left to ensure both fit in the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef1b4f7db09bdf74.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, golden brown pastry at lower left or yellow matte cookie at right?" }, { "from": "gpt", "value": "golden brown pastry at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df3bc227b1d61831.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a group shot of the blue matte cap at center and the black leather boots at left. The camera you are using has a maximum focusing distance of 5 meters. Will you be able to focus on both objects simultaneously?" }, { "from": "gpt", "value": "The blue matte cap at center is 5.09 meters away from the black leather boots at left. Since the maximum focusing distance is 5 meters, the distance between them exceeds the camera capability, so you cannot focus on both simultaneously." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e1f8a0acab223cde.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of black glossy ant at upper right. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.846, 0.298)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0079ea281058458c.jpg", "conversations": [ { "from": "human", "value": "\nLocate the denim shorts at center in the image." }, { "from": "gpt", "value": "[(0.461, 0.573)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ad4785509f615598.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the edge of the gray concrete dam at center and want to walk back to your car parked at the starting point, which is 20 meters away from the dam. Can you reach your car without needing to walk more than 20 meters?" }, { "from": "gpt", "value": "The distance between the gray concrete dam at center and the camera is 17.06 meters. Since your car is parked 20 meters away from the dam, you can reach it by walking back towards the camera direction, as 17.06 meters is less than 20 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc87fd634e2e97b7.jpg", "conversations": [ { "from": "human", "value": "\nHow close is painted wood statue at center from camera?" }, { "from": "gpt", "value": "painted wood statue at center is 5.11 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/148038322d24570b.jpg", "conversations": [ { "from": "human", "value": "\nYou are an observer standing on the pier where the metallic gray boat at center and the white plastic boat at lower center are docked. Which boat is positioned higher relative to the other?" }, { "from": "gpt", "value": "The metallic gray boat at center is positioned higher than the white plastic boat at lower center because it is located above it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5adbba6ef88da9f4.jpg", "conversations": [ { "from": "human", "value": "\nBetween matte gray sedan at center and satin silver car at lower left, which one is positioned lower?" }, { "from": "gpt", "value": "matte gray sedan at center is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07b7a9c5da6b9dc5.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the yellow matte shirt at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.126, 0.725)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/021d6c94ceb01bd6.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.111, 0.967) lie behind point (0.301, 0.327)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7a02c5a066069179.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.380, 0.358)?" }, { "from": "gpt", "value": "white glossy building at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/21f9ebe3f1d1ad83.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.717, 0.456) or point (0.452, 0.875)?" }, { "from": "gpt", "value": "Point (0.452, 0.875) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58d47620a0b31818.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up a shoot in the scene described. You need to place a small prop between the black leather shoe at upper center and the black leather neckband at upper center. Which object should the prop be closer to if you want it to be visually balanced based on their heights?" }, { "from": "gpt", "value": "The black leather shoe at upper center is taller than the black leather neckband at upper center. To achieve visual balance, the prop should be placed closer to the black leather neckband at upper center since it is shorter, compensating for the height difference between the two objects." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/81dee5c42b15b62d.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of orange smooth jumpsuit at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.217, 0.677)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77b040d9754ac244.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and want to reach the point marked as point (0.246, 0.205). If you walk straight towards it, how far will you have to walk?" }, { "from": "gpt", "value": "The point (0.246, 0.205) is 56.54 feet away from the camera, so you will have to walk 56.54 feet to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/59394ec5fada3878.jpg", "conversations": [ { "from": "human", "value": "\nHow far is silver satin shirt at right from camera?" }, { "from": "gpt", "value": "silver satin shirt at right is 1.78 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44afa93f55108479.jpg", "conversations": [ { "from": "human", "value": "\nYou are a visitor standing in front of the architectural structure. You notice the white corrugated metal sheep head at right and the white matte dog head at left. Which object is closer to you?" }, { "from": "gpt", "value": "The white corrugated metal sheep head at right is positioned over the white matte dog head at left, meaning it is closer to you." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f508ee6b6d60526e.jpg", "conversations": [ { "from": "human", "value": "\nWhere is gray herringbone blazer at left located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.226, 0.644)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0aeed3c34b12873e.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.984, 0.847) or (0.473, 0.711)?" }, { "from": "gpt", "value": "Point (0.984, 0.847) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/67b5c76ef9663887.jpg", "conversations": [ { "from": "human", "value": "\nBetween matte black top hat at center and shiny black suit at upper right, which one is positioned lower?" }, { "from": "gpt", "value": "Positioned lower is matte black top hat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b9331c8c966aa75.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, white glossy drawer at lower right or golden crispy french fries at center, stands taller?" }, { "from": "gpt", "value": "white glossy drawer at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fd8a86b4b9d08199.jpg", "conversations": [ { "from": "human", "value": "\nBetween white matte blazer at center and yellow silk sari at center, which one has less height?" }, { "from": "gpt", "value": "yellow silk sari at center is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b58128e69ae1a822.jpg", "conversations": [ { "from": "human", "value": "\nIs metal/wooden ledge at center smaller than matte orange cone at center?" }, { "from": "gpt", "value": "No, metal/wooden ledge at center is not smaller than matte orange cone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd2e89bacd400805.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.576, 0.973) lie behind point (0.333, 0.539)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5ef466537d140ba9.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of green liquid water at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.500, 0.887)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c41fc963e5c42cdf.jpg", "conversations": [ { "from": "human", "value": "\nIs brown woolen sweater at lower right to the right of matte black t-shirt at lower left from the viewer's perspective?" }, { "from": "gpt", "value": "Indeed, brown woolen sweater at lower right is positioned on the right side of matte black t-shirt at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cdf6c9002c3e4cfa.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the matte black blazer at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.643, 0.527)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02d05d4671975463.jpg", "conversations": [ { "from": "human", "value": "\nIs metallic silver mirror at center below matte black camera at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4c90e7b1369db46c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white glossy plate at center is positioned to the right of matte brown plate at center?" }, { "from": "gpt", "value": "Correct, you'll find white glossy plate at center to the right of matte brown plate at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2cfbdf0c9acdb702.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the red glossy flag at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.192, 0.508)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e604520f33f1d19e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue glossy bus at center is thinner than blue fabric pants at lower center?" }, { "from": "gpt", "value": "Yes, blue glossy bus at center is thinner than blue fabric pants at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dda32fb700539a10.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.689, 0.397) or point (0.715, 0.522)?" }, { "from": "gpt", "value": "Point (0.689, 0.397)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/989efb8f156c95d4.jpg", "conversations": [ { "from": "human", "value": "\nDoes black matte jacket at center have a lesser height compared to brown fur dog at right?" }, { "from": "gpt", "value": "In fact, black matte jacket at center may be taller than brown fur dog at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2a4c63c81f7fb340.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the rustic stone bridge and want to know where the metallic brown rail at upper center is located. According to the coordinates given, what are its exact coordinates?" }, { "from": "gpt", "value": "The metallic brown rail at upper center is located at coordinates point (0.157, 0.267)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5ed79e8eb492765.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.837, 0.362)?" }, { "from": "gpt", "value": "smooth skin face at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/53454f618136924e.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, orange plastic kayak at lower center or green leafy trees at upper center?" }, { "from": "gpt", "value": "orange plastic kayak at lower center is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c222ae539e14d8f9.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between green textured hill at center and green matte tree at lower center?" }, { "from": "gpt", "value": "green textured hill at center and green matte tree at lower center are 9.17 feet apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c65e6d069f7ac0d0.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of black matte suit at center in the image." }, { "from": "gpt", "value": "[(0.300, 0.669)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aae2c76fd177c542.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green leafy tree at left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.091, 0.512)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f98a730ba8d8194c.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of gray asphalt road at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.481, 0.866)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bdca5261ca848305.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the left, black suit at left or smooth gray suit at center?" }, { "from": "gpt", "value": "From the viewer's perspective, black suit at left appears more on the left side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4bd3a029037b0d3c.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of green textured tree at center?" }, { "from": "gpt", "value": "A distance of 7.34 meters exists between green textured tree at center and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/836ad67af7aefc96.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the camouflage fabric pants at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.208, 0.617)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/371c8961494fe757.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the vantage point overlooking the ocean and islands. There is a specific point marked at coordinates point (0.615, 0.878) in your field of view. You have a laser pointer that can reach up to 4 meters. Can your laser pointer reach that point?" }, { "from": "gpt", "value": "The point (0.615, 0.878) is 3.57 meters away from the viewer, so yes, the laser pointer can reach it since its range is within the 4 meters limit." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d490cc2bc38f382.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.897, 0.822)?" }, { "from": "gpt", "value": "yellow plastic slide at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c71e2d3efa60c3f6.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, green woolen suit at center or green furry puppet at center?" }, { "from": "gpt", "value": "green woolen suit at center is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f8105282a9ac147d.jpg", "conversations": [ { "from": "human", "value": "\nDoes green matte shirt at center appear under black smooth shirt at center?" }, { "from": "gpt", "value": "Yes, green matte shirt at center is below black smooth shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e5d4a8ab55da1cfe.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the dark gray t-shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.552, 0.537)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/83ef89a160c4d262.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the railway station platform and want to take a photo of both the point at coordinates (0.835, 0.541) and the point at coordinates (0.658, 0.614). Which point should you focus on first to ensure both are in clear view?" }, { "from": "gpt", "value": "You should focus on point (0.835, 0.541) first because it is closer to the camera than point (0.658, 0.614), ensuring both points are in focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9192d22a5bf5b06b.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, white rubber asphalt spreader at center or orange reflective road roller at center?" }, { "from": "gpt", "value": "white rubber asphalt spreader at center is more to the right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd8451f2f3bd8094.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of matte brown dog at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.762, 0.539)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4b70834f5c45fed2.jpg", "conversations": [ { "from": "human", "value": "\nWhere is wooden table at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.412, 0.877)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7e32216849ef84d.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from silver metallic car at lower left to camera." }, { "from": "gpt", "value": "A distance of 51.63 meters exists between silver metallic car at lower left and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f00b4e12f7f4ea5a.jpg", "conversations": [ { "from": "human", "value": "\nDoes white textured statue at center have a greater height compared to green translucent fish at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc2371af7b30e3f8.jpg", "conversations": [ { "from": "human", "value": "\nHow distant is matte gray sedan at center from silver metallic sedan at right?" }, { "from": "gpt", "value": "matte gray sedan at center is 12.51 feet away from silver metallic sedan at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/725bd81ac6bcc4b4.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of white glossy seaplane at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.559, 0.652)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e640a24031c343f8.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of navy blue fabric uniform at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.595, 0.814)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bea029bdc389f82a.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to black plastic chair at lower center? Please provide its 2D coordinates.Where can I find black plastic chair at lower center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.518, 0.906)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5ffad5dd52c3cab8.jpg", "conversations": [ { "from": "human", "value": "\nIs matte white lounge chair at center to the left of matte beige chair at lower right from the viewer's perspective?" }, { "from": "gpt", "value": "Yes, matte white lounge chair at center is to the left of matte beige chair at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2d2912e2affa261.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the group of eight individuals. You need to locate two specific points marked in the image. The first point is at coordinate point(0.726, 0.809) and the second is at point(0.261, 0.444). Which of these two points is closer to you?" }, { "from": "gpt", "value": "Point(0.726, 0.809) is in front of point(0.261, 0.444), so it is closer to you." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3df7b30a90d345ea.jpg", "conversations": [ { "from": "human", "value": "\nDoes colorful paper cake at center lie in front of matte pink cake at center?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/509b1ec2f3e507b9.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.000, 0.798) and camera." }, { "from": "gpt", "value": "They are 152.88 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/74b52f10a5fd3596.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if smooth concrete waterway at center is taller than brown cotton shirt at center?" }, { "from": "gpt", "value": "Correct, smooth concrete waterway at center is much taller as brown cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0c899b5c3145450c.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.414, 0.802)?" }, { "from": "gpt", "value": "wooden table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7fca8afd56ef7495.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.624, 0.783) or (0.213, 0.478)?" }, { "from": "gpt", "value": "Positioned behind is point (0.213, 0.478)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c058af4c9a085e7a.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between point (0.944, 0.491) and camera." }, { "from": "gpt", "value": "They are 13.20 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8540e0f1684f9b6.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the left, matte brown jacket at left or fuzzy brown dog at center?" }, { "from": "gpt", "value": "From the viewer's perspective, matte brown jacket at left appears more on the left side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a221ef12765f8afd.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the white smooth clock tower at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.607, 0.530)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b56092c89ed919d.jpg", "conversations": [ { "from": "human", "value": "\nDoes red matte star at upper center appear on the right side of blue fleece jacket at center?" }, { "from": "gpt", "value": "Incorrect, red matte star at upper center is not on the right side of blue fleece jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/005b85e75c666374.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray concrete bridge at upper left is thinner than dark gray jacket at center?" }, { "from": "gpt", "value": "Incorrect, gray concrete bridge at upper left's width is not less than dark gray jacket at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/858eb4b4f3b019e1.jpg", "conversations": [ { "from": "human", "value": "\nYou are a painter who needs to place a 15 cm wide painting on the table. The table is between the brown matte table at center and the matte black hand at left. Can the painting fit on the table?" }, { "from": "gpt", "value": "The brown matte table at center might be wider than matte black hand at left, so the painting could fit if the table is wide enough. However, since the exact width isn t specified, it s uncertain. Please measure the table first." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9181c8b7e316ff2a.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of brown stone bridge at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.504, 0.742)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb377796c8bb96ee.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of silver metallic suv at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.455, 0.769)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cac08cd6ecb07a58.jpg", "conversations": [ { "from": "human", "value": "\nYou are setting up a new monitor in the office. The black glossy monitor at center needs to be placed on the brown wooden table at lower left. Is there enough space for the monitor?" }, { "from": "gpt", "value": "The black glossy monitor at center is positioned over the brown wooden table at lower left, so yes, there is enough space for the monitor on the brown wooden table at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7df89eb120a7f522.jpg", "conversations": [ { "from": "human", "value": "\nIs stainless steel oven at center wider than satin steel sink at center?" }, { "from": "gpt", "value": "Indeed, stainless steel oven at center has a greater width compared to satin steel sink at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3f5ea232839b6dfd.jpg", "conversations": [ { "from": "human", "value": "\nYou are an art student analyzing the sculpture and its surroundings. From your vantage point, does the bronze sculpture at center appear higher or lower than the smooth concrete pillar at center right?" }, { "from": "gpt", "value": "The bronze sculpture at center is located below the smooth concrete pillar at center right, so it appears lower than the pillar." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/66c29aa8cf5580e3.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of white fluffy snow at lower left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.481, 0.898)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02a75c2104ff40b8.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if metallic silver truck at center is positioned above straw hat at center?" }, { "from": "gpt", "value": "No, metallic silver truck at center is not above straw hat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1cd899189a4ccb9f.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, white matte car at lower right or shiny black car at center?" }, { "from": "gpt", "value": "shiny black car at center is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1740552c7dd4dc1.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between matte plastic puzzle pieces at center and camera." }, { "from": "gpt", "value": "The distance of matte plastic puzzle pieces at center from camera is 6.06 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b388df1713885dd5.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.749, 0.205) less distant than point (0.452, 0.256)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.452, 0.256)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e4c5b41c857efea.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.143, 0.959) and point (0.374, 0.438), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.143, 0.959) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dcaf5afc1e54ddaa.jpg", "conversations": [ { "from": "human", "value": "\nIs dark gray fabric jacket at center thinner than purple fabric at center?" }, { "from": "gpt", "value": "In fact, dark gray fabric jacket at center might be wider than purple fabric at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b3fe75abfc49c61c.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a candid shot of the matte fleece jacket at center and the white rubber shoe at lower right. Based on their positions, which object should you focus on first to ensure both are in the frame?" }, { "from": "gpt", "value": "The matte fleece jacket at center is below the white rubber shoe at lower right, so you should focus on the white rubber shoe at lower right first to ensure both are in the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f503930b8287ae41.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the scene and want to walk from the green grassy hillside at lower left to the green leafy tree at center. Which direction should you move to get closer to the tree?" }, { "from": "gpt", "value": "To get closer to the green leafy tree at center, you should move away from the green grassy hillside at lower left since it is closer to the viewer than the tree." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7645f563a4207985.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.847, 0.673) and point (0.793, 0.405), which one is positioned behind?" }, { "from": "gpt", "value": "Positioned behind is point (0.793, 0.405)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9fc8c8aeef760c7.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the yellow striped surfboard at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.070, 0.673)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/374d2c762094371c.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.158, 0.867) and point (0.883, 0.900), which one is positioned behind?" }, { "from": "gpt", "value": "Positioned behind is point (0.158, 0.867)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2454fff8e865c0c3.jpg", "conversations": [ { "from": "human", "value": "\nDoes blonde paper mask at center appear on the right side of smooth skin face at center?" }, { "from": "gpt", "value": "No, blonde paper mask at center is not to the right of smooth skin face at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b289def9676bbdc5.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.617, 0.177) or (0.941, 0.206)?" }, { "from": "gpt", "value": "Point (0.617, 0.177)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7ac7c8ce069067f.jpg", "conversations": [ { "from": "human", "value": "\nDoes white textured bark at center have a lesser width compared to clear glass window at center?" }, { "from": "gpt", "value": "Incorrect, white textured bark at center's width is not less than clear glass window at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aab449d7184ac9a0.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green matte shorts at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.437, 0.477)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4b97ecb8e9446ed2.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of green grassy hillside at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.436, 0.816)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d41184195349329c.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the right, matte gray sweater at center or plaid flannel shirt at upper right?" }, { "from": "gpt", "value": "plaid flannel shirt at upper right is more to the right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/80176b4183baeeac.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.752, 0.236) lie behind point (0.480, 0.858)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3724da57dd538c08.jpg", "conversations": [ { "from": "human", "value": "\nPoint to rusty metal train at center.Point to the rusty metal train at center in the image." }, { "from": "gpt", "value": "[(0.576, 0.609)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04d16de390eef81e.jpg", "conversations": [ { "from": "human", "value": "\nYou are a drone operator trying to capture aerial footage of the brown sandy dirt field at center and the white cotton shirt at center. Which object should you focus on first if you want to film from top to bottom?" }, { "from": "gpt", "value": "The brown sandy dirt field at center is taller than the white cotton shirt at center, so you should focus on the brown sandy dirt field at center first when filming from top to bottom." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2169eaa9bd613c2.jpg", "conversations": [ { "from": "human", "value": "\nBetween blue matte jacket at lower right and plaid shirt at lower left, which one is positioned lower?" }, { "from": "gpt", "value": "blue matte jacket at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/52825a1c126e699e.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the pale skin at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.298, 0.766)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/13f6a7e70b53ecd1.jpg", "conversations": [ { "from": "human", "value": "\nHow close is dark gray pinstripe suit at left from camera?" }, { "from": "gpt", "value": "dark gray pinstripe suit at left is 7.06 feet from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46a97d21d4b18336.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.269, 0.116) positioned in front of point (0.261, 0.369)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7490319f2f74b627.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the two people holding the rivalry signs. You want to take a photo of the person holding the sign with the cardinal graphic. How far should you stand from the point at coordinates point (0.194, 0.789) to capture them clearly?" }, { "from": "gpt", "value": "You should stand approximately 2.76 meters away from the point at coordinates point (0.194, 0.789) to capture the person holding the cardinal graphic sign clearly, as that is the distance between the point and the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/76d9cb92c2ad9ed3.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any matte black suit at left in the image." }, { "from": "gpt", "value": "[(0.274, 0.648)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/da41e8fd48aa8f9c.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from point (0.767, 0.628) to camera." }, { "from": "gpt", "value": "Point (0.767, 0.628) is 11.43 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d74020ca592b4256.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the green leafy tree at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.442, 0.797)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d8c4f12ed5c2a65.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the event and need to capture a shot where both the dark wool suit at center and the suede jacket at right are visible. Based on their positions, which one should you ensure is closer to the left side of your camera frame?" }, { "from": "gpt", "value": "The dark wool suit at center is to the left of the suede jacket at right, so to ensure both are visible, the dark wool suit at center should be positioned on the left side of the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e093e912f77fe96b.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up for a group photo. You have a 10 inch wide prop that needs to be placed between the blue satin shirt at center and the fuzzy fur vest at right. Will there be enough space to fit the prop between them?" }, { "from": "gpt", "value": "The blue satin shirt at center is 9.98 inches from the fuzzy fur vest at right, so the 10 inch wide prop will not fit between them as the distance is slightly less than the prop width." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e408cd2aaba1b890.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, dark gray uniform at right or gray uniformed man at upper left, stands shorter?" }, { "from": "gpt", "value": "dark gray uniform at right is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4899bd62624703f9.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the blue fabric at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.775, 0.759)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9af02a9cd9d0c35.jpg", "conversations": [ { "from": "human", "value": "\nYou are a food critic evaluating the presentation of the guacamole. Considering the green creamy guacamole at center and the black shirt at upper center, which one takes up more visual space in the image?" }, { "from": "gpt", "value": "The black shirt at upper center occupies more visual space than the green creamy guacamole at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e1941acaaa3759d7.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.584, 0.512) or point (0.816, 0.916)?" }, { "from": "gpt", "value": "Point (0.816, 0.916) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/230c14abcd0c0f94.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.706, 0.542) or (0.904, 0.778)?" }, { "from": "gpt", "value": "Point (0.904, 0.778)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e1ab7e4e71a06dd.jpg", "conversations": [ { "from": "human", "value": "\nYou are at the water park and see the orange plastic kayak at left and the brown fur at lower right. Which object is larger?" }, { "from": "gpt", "value": "The orange plastic kayak at left is bigger than the brown fur at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eaf2aa932d6cf096.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the right, gold glossy horse at center or red velvet poinsettia at center?" }, { "from": "gpt", "value": "Positioned to the right is gold glossy horse at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23336fc608785ae7.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.343, 0.566) or (0.804, 0.853)?" }, { "from": "gpt", "value": "The point (0.804, 0.853) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8230f0adbe88b279.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a matte black glasses at center. Pinpoint a point to the matte black glasses at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.781, 0.622)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/76d3ac8c82351900.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.873, 0.713) from camera?" }, { "from": "gpt", "value": "Point (0.873, 0.713) is 14.67 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58b4f3eeae6a92f9.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position looking at the urban scene. There is a point marked at coordinates point (0.792, 0.670). How far is that point from you?" }, { "from": "gpt", "value": "The point (0.792, 0.670) is 69.60 meters away from the camera position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/181596df2d9a23cd.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.073, 0.222) or (0.033, 0.211)?" }, { "from": "gpt", "value": "The point (0.073, 0.222) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2abec3df2dcc9a3b.jpg", "conversations": [ { "from": "human", "value": "\nLocate blue plastic slide at center in the image." }, { "from": "gpt", "value": "[(0.183, 0.780)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/62866a82188f838d.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of brown glazed vase at lower left in the image." }, { "from": "gpt", "value": "[(0.186, 0.745)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a61934cf953886d.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing in the restaurant and want to take a picture of both the camera on the table and the person making dough. Which object is closer to you, the point representing the camera at point (0.747, 0.839) or the point representing the person making dough at point (0.854, 0.852)?" }, { "from": "gpt", "value": "The point representing the camera at point (0.747, 0.839) is closer to you than the point representing the person making dough at point (0.854, 0.852) because it is further to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c766687a6e12f6f0.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.807, 0.855) and point (0.529, 0.761), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.529, 0.761) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/686d19ea7838f861.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of bronze sculpture at center from camera?" }, { "from": "gpt", "value": "The distance of bronze sculpture at center from camera is 3.39 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ec2f591b81edc6d.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.048, 0.920) or (0.140, 0.961)?" }, { "from": "gpt", "value": "Point (0.140, 0.961)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc08d6bfbe2ae7b4.jpg", "conversations": [ { "from": "human", "value": "\nHow far is point (0.299, 0.748) from the camera?" }, { "from": "gpt", "value": "Point (0.299, 0.748) is 67.66 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c75494020af94668.jpg", "conversations": [ { "from": "human", "value": "\nYou are a jewelry designer examining the image of the earrings. You need to determine which object takes up more space between the black crystal earrings at center and the black crystal cluster at center. Which one is it?" }, { "from": "gpt", "value": "The black crystal cluster at center takes up more space than the black crystal earrings at center, as the description states that the black crystal earrings at center occupies less space than the black crystal cluster at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bb924c16816f086b.jpg", "conversations": [ { "from": "human", "value": "\nPoint to white sheer robe at lower center.Point to the white sheer robe at lower center in the image." }, { "from": "gpt", "value": "[(0.369, 0.784)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/66446427b57b1f4a.jpg", "conversations": [ { "from": "human", "value": "\nYou are a fashion designer analyzing the image. You need to determine which shirt, the blue cotton shirt at center or the brown textured shirt at center, has a narrower width for designing a similar garment. Which one should you reference?" }, { "from": "gpt", "value": "The blue cotton shirt at center has a narrower width compared to the brown textured shirt at center, so you should reference the blue cotton shirt at center for designing a narrower garment." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e1b5004212b6eee4.jpg", "conversations": [ { "from": "human", "value": "\nIs white cotton shirt at lower left positioned before brown cotton shirt at center?" }, { "from": "gpt", "value": "Yes, white cotton shirt at lower left is in front of brown cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/001613b3cef96674.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of camouflage fabric robe at left in the image." }, { "from": "gpt", "value": "[(0.101, 0.477)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aaa1293f2fae5600.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.337, 0.819) positioned after point (0.599, 0.198)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ebb236e846f24ea1.jpg", "conversations": [ { "from": "human", "value": "\nPoint to brown mud at lower center.Point to the brown mud at lower center in the image." }, { "from": "gpt", "value": "[(0.715, 0.716)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/26bb892485ec3b74.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, white textured fabric at upper right or white uniform at center?" }, { "from": "gpt", "value": "white uniform at center is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e9558699736d5f89.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, brown furry bear at center or fuzzy brown bear at center?" }, { "from": "gpt", "value": "fuzzy brown bear at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/002a0574cfd9f690.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.283, 0.452) closer to camera compared to point (0.972, 0.403)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.972, 0.403)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a613fdbe42a4c6e0.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the silver metallic necklace at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.543, 0.808)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5bf422febb763b75.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point with coordinates point (0.519, 0.630). Looking around, you see a metallic orange airplane at center. What object is located exactly at your current position?" }, { "from": "gpt", "value": "The metallic orange airplane at center is located exactly at point (0.519, 0.630)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ee31546e571ae16a.jpg", "conversations": [ { "from": "human", "value": "\nLocate the brown rough sweet potatoes at center in the image." }, { "from": "gpt", "value": "[(0.480, 0.787)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b3a66dea8d437924.jpg", "conversations": [ { "from": "human", "value": "\nIs blue satin blouse at center taller than shiny metallic balloon at left?" }, { "from": "gpt", "value": "Yes, blue satin blouse at center is taller than shiny metallic balloon at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c586e54789f12f1b.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.804, 0.570) or point (0.346, 0.542)?" }, { "from": "gpt", "value": "Point (0.346, 0.542)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e21d88e59f72dd95.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between point (0.231, 0.556) and camera?" }, { "from": "gpt", "value": "They are 6.90 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0838c8ec06762e16.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.606, 0.866) more distant than point (0.704, 0.514)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/121c72df3e6f8aa1.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.365, 0.484) behind point (0.453, 0.608)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e5945b60f0050f1.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a clear shot of the black rubber pole at center without the glassy reflective skyscraper at left obstructing it. Based on their positions, is this possible?" }, { "from": "gpt", "value": "The glassy reflective skyscraper at left is positioned over the black rubber pole at center, so it would obstruct the view. To capture the pole clearly, you would need to adjust your angle or position to avoid the skyscraper." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/99c89831e38019a4.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked by the coordinates point (0.590, 0.948) in the image. How far are you from the viewer?" }, { "from": "gpt", "value": "The distance between point (0.590, 0.948) and the viewer is 2.45 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ead45f5061a5b28.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.421, 0.848) more distant than point (0.406, 0.330)?" }, { "from": "gpt", "value": "Yes, point (0.421, 0.848) is behind point (0.406, 0.330)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0823c3da165d5e5.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of green grassy field at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.504, 0.784)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/020d49a8bbc0159d.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the right, matte orange safety vest at center or green hard hat at center?" }, { "from": "gpt", "value": "From the viewer's perspective, matte orange safety vest at center appears more on the right side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/203aec3694386c5d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black wooden building at center is taller than white fuzzy coat at lower left?" }, { "from": "gpt", "value": "Yes, black wooden building at center is taller than white fuzzy coat at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/10f73f172dd24839.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.898, 0.919) in front of point (0.827, 0.961)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.827, 0.961)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a0268c01e36e3857.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the center of the scene. There is a point marked at coordinates point (0.306, 0.336). How far is this point from you in feet?" }, { "from": "gpt", "value": "The point (0.306, 0.336) is 9.63 feet away from you." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/644685dc5f024d3c.jpg", "conversations": [ { "from": "human", "value": "\nPoint to black leather sandals at upper center.Point to the black leather sandals at upper center in the image." }, { "from": "gpt", "value": "[(0.665, 0.298)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e93e280659db3d2.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the exhibition and need to adjust the lighting so that the blue textured sweater at upper left and the black plastic crt monitor at center are both visible. Since the sweater is taller than the monitor, which object might cast a shadow over the other if the light is placed above them?" }, { "from": "gpt", "value": "The blue textured sweater at upper left is taller than the black plastic crt monitor at center, so if the light is placed above them, the blue textured sweater at upper left would cast a shadow over the black plastic crt monitor at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/39842d5b2636f429.jpg", "conversations": [ { "from": "human", "value": "\nYou are a pedestrian standing on the gray asphalt path at center and want to approach the white matte shirt at center. Which direction should you move to reach them?" }, { "from": "gpt", "value": "The gray asphalt path at center is positioned on the right side of white matte shirt at center. To reach them, you should move to your left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2db779e1439f29b7.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.389, 0.728) and point (0.566, 0.616), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.389, 0.728) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c859a0b02882554.jpg", "conversations": [ { "from": "human", "value": "\nYou are an art conservator assessing the statue and spear in the image. You need to determine if the stone statue at center can be placed on a pedestal that is narrower than the smooth metal spear at upper left. Can it fit?" }, { "from": "gpt", "value": "The stone statue at center might be wider than the smooth metal spear at upper left, so if the pedestal is narrower than the spear, the statue may not fit properly. Further measurements are needed to confirm." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/529142fc84563f2e.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of white printed blouse at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.537, 0.741)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf04a4a5a1e72325.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black leather jacket at center is positioned to the right of transparent glass at lower left?" }, { "from": "gpt", "value": "Yes, black leather jacket at center is to the right of transparent glass at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d00031eae3718dd0.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.591, 0.239) and camera." }, { "from": "gpt", "value": "They are 4.43 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/747996ac87080781.jpg", "conversations": [ { "from": "human", "value": "\nPoint to blue painted wood table at center.Point to the blue painted wood table at center in the image." }, { "from": "gpt", "value": "[(0.848, 0.717)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a57b68d8a3133d1a.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the room and want to take a photo of the green matte shirt at upper left. How far should you position yourself from the shirt to capture it clearly?" }, { "from": "gpt", "value": "The green matte shirt at upper left is 30.62 inches away from the camera, so you should position yourself approximately 30.62 inches away to capture it clearly." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d53b88bf23179d6.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.290, 0.533) from camera?" }, { "from": "gpt", "value": "Point (0.290, 0.533) is 253.07 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cec381c9c65681fc.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the striped polo shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.472, 0.791)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b60656631cc51950.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.498, 0.697)?" }, { "from": "gpt", "value": "brown wooden table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c70510caa867722d.jpg", "conversations": [ { "from": "human", "value": "\nPoint to black chain-link fence at center.Point to the black chain-link fence at center in the image." }, { "from": "gpt", "value": "[(0.588, 0.684)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0c9275268eaab6c2.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of dark gray sweatshirt at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.778, 0.573)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/048edd7aeebaa310.jpg", "conversations": [ { "from": "human", "value": "\nIn the image of the brainstorming session, there are two people wearing a black fabric shirt at center and a striped fabric shirt at right. Which one is positioned to the left?" }, { "from": "gpt", "value": "The black fabric shirt at center is positioned to the left of the striped fabric shirt at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0bcd1ff6ae6b54b9.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of dark gray leather jacket at right. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.918, 0.666)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/594faf8a1130e49e.jpg", "conversations": [ { "from": "human", "value": "\nYou are a pedestrian standing in front of the white glossy police car at center and the black plastic license plate at center. Which object is positioned to the right?" }, { "from": "gpt", "value": "The white glossy police car at center is positioned to the right of the black plastic license plate at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5a287e1b59c8adc.jpg", "conversations": [ { "from": "human", "value": "\nIs dark blue shirt at upper left closer to camera compared to pink satin dress at center?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86a63062be84059a.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between blue knitted hammock at center and wooden chair at center?" }, { "from": "gpt", "value": "blue knitted hammock at center is 1.45 meters away from wooden chair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c773ee31088e3ca.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the event and want to capture a closeup of both the orange matte shirt at center and the teal satin dress at center in the same frame. Given that your camera has a minimum focusing distance of 2 meters, will you be able to achieve this without moving closer?" }, { "from": "gpt", "value": "The orange matte shirt at center is 2.28 meters away from the teal satin dress at center. Since the minimum focusing distance is 2 meters, the photographer can capture both in the same frame as the distance between them is sufficient." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e9d17ff24137f50b.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between point (0.927, 0.602) and camera?" }, { "from": "gpt", "value": "They are 673.59 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e6f97333153bd67e.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.056, 0.455) lie in front of point (0.266, 0.278)?" }, { "from": "gpt", "value": "Yes, point (0.056, 0.455) is in front of point (0.266, 0.278)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2a37249bab714620.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.202, 0.725) behind point (0.622, 0.880)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d94e262db33e5c6e.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray concrete at lower left have a smaller size compared to brown fur mouse at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8f9371240af271d2.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.978, 0.728) or (0.930, 0.966)?" }, { "from": "gpt", "value": "The point (0.978, 0.728) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e1a93537e6204859.jpg", "conversations": [ { "from": "human", "value": "\nYou are a drone operator flying over the city. Your drone is currently above the dark gray concrete skyscraper at left and the smooth glass skyscraper at center. If you look downward, which skyscraper will appear larger in your camera view?" }, { "from": "gpt", "value": "The dark gray concrete skyscraper at left appears larger in the camera view because it is positioned closer to the drone than the smooth glass skyscraper at center, which is farther away." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/467a7fb4030a3e04.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.548, 0.281) and point (0.433, 0.756), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.433, 0.756) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0ed4765b606feb5.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of the New York Stock Exchange and want to take a photo of the festive wreath with the large red bow. The wreath is located at point (0.392, 0.248). If you are currently 44.15 meters away from this point, is this distance too far to capture the wreath clearly in your photo?" }, { "from": "gpt", "value": "The point (0.392, 0.248) is 44.15 meters away from the camera. This distance might be too far to capture the festive wreath with the large red bow clearly in the photo, as most cameras require closer proximity for detailed shots of specific objects like wreaths." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78a4cdd0bf038cc7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray matte hoodie at center is shorter than black matte jacket at center?" }, { "from": "gpt", "value": "Correct, gray matte hoodie at center is not as tall as black matte jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/afc626717057f0c5.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, blue striped shirt at right or shiny metallic drum at center?" }, { "from": "gpt", "value": "shiny metallic drum at center is above." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c9021c416411c937.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of brown rough bark tree at upper center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.745, 0.128)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b814776ddf001e0e.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of shiny silver bicycle at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.750, 0.648)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/111ff86d921fc932.jpg", "conversations": [ { "from": "human", "value": "\nDoes black lace dress at center lie in front of dark brown hair at upper right?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5f59b3ccc1fd6636.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.700, 0.420) or (0.136, 0.922)?" }, { "from": "gpt", "value": "Point (0.136, 0.922)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/373b080c66398ab4.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, matte white blouse at center or black plastic microphone at center, stands taller?" }, { "from": "gpt", "value": "Standing taller between the two is matte white blouse at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/289bfd2ed980b7de.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the bridge and want to take a photo of the clear water at center and the gray concrete water at right. Which one should you focus on first if you want to capture both in the same frame?" }, { "from": "gpt", "value": "You should focus on the clear water at center first because it is closer to you than the gray concrete water at right, allowing both to be in the same frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db4cb18092bbb06d.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a green fabric jacket at center. Pinpoint a point to the green fabric jacket at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.470, 0.527)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ee6ee24f47a57ff3.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.507, 0.898) or point (0.204, 0.267)?" }, { "from": "gpt", "value": "Positioned in front is point (0.507, 0.898)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/abc65ad3229ff63c.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of white wood chair at lower left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.347, 0.897)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8155cbc8a31b47d.jpg", "conversations": [ { "from": "human", "value": "\nYou are a maintenance worker needing to reach the dark gray stone clock at upper right from the brick textured clock tower at upper right. Given that your ladder can extend up to 40 feet, will you be able to reach the clock without moving the ladder?" }, { "from": "gpt", "value": "The distance between the brick textured clock tower at upper right and the dark gray stone clock at upper right is 41.45 feet. Since your ladder only extends to 40 feet, you will not be able to reach the clock without moving the ladder." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f81b6918543feaee.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is white steam at center from camera?" }, { "from": "gpt", "value": "The distance of white steam at center from camera is 68.68 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c85449056624525e.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, black matte glove at center or matte black leather jacket at center?" }, { "from": "gpt", "value": "black matte glove at center is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ccd0040ae4eef3e.jpg", "conversations": [ { "from": "human", "value": "\nIs american flag tablecloth at center wider than pink plaid shirt at right?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9bc768c4d56ef1cb.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.649, 0.605) come in front of point (0.953, 0.056)?" }, { "from": "gpt", "value": "Yes, point (0.649, 0.605) is in front of point (0.953, 0.056)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d793e776f311f7ac.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, curly hair at upper right or dark gray hoodie at center, stands taller?" }, { "from": "gpt", "value": "Standing taller between the two is curly hair at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/931ea93b711e5339.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of smooth skin man at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.661, 0.598)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dea24b687bb81548.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a group photo of the children at the Halloween party. You notice the light blue shirt at center and the striped sweater at left. Which child should you ask to stand up slightly to ensure both are visible in the photo?" }, { "from": "gpt", "value": "The striped sweater at left should be asked to stand up since the light blue shirt at center is already taller, ensuring both can be seen clearly." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3ae845d200a50103.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the edge of the waterfall in the image and want to place a small statue on the green mossy log at lower center. The coordinates given are point (0.628, 0.908). Can you confirm if this point is indeed where the green mossy log is located?" }, { "from": "gpt", "value": "Yes, according to the provided coordinates, point (0.628, 0.908) corresponds to the green mossy log at lower center, so placing the statue there would be accurate." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/077e7164ba6098ad.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.638, 0.600) and point (0.669, 0.659), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.638, 0.600) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dbeeb8f84321182c.jpg", "conversations": [ { "from": "human", "value": "\nIs glossy dark brown car at center wider than matte silver car at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c7c0569f179c1c7.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the left, brown woolen goat at center or light brown fur monkey at right?" }, { "from": "gpt", "value": "From the viewer's perspective, brown woolen goat at center appears more on the left side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e516788cf70011f9.jpg", "conversations": [ { "from": "human", "value": "\nIs brown wooden logs at lower left to the left of rusty wood dock at lower left from the viewer's perspective?" }, { "from": "gpt", "value": "In fact, brown wooden logs at lower left is to the right of rusty wood dock at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de4575b669f76e4c.jpg", "conversations": [ { "from": "human", "value": "\nYou are an artist analyzing the Plastic Mullet Series. In the image, you see a brown matte eye at center and a matte gold eyebrow at upper center. Which object is taller?" }, { "from": "gpt", "value": "The brown matte eye at center has a greater height compared to the matte gold eyebrow at upper center, so the brown matte eye at center is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e25872b4f328377.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the white matte van at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.919, 0.186)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/325f226c5258773a.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, smooth gray tree trunk at center or green leafy tree at center?" }, { "from": "gpt", "value": "smooth gray tree trunk at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/902b4546d90a29da.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the left, green leafy hedge at center or green lawn at center?" }, { "from": "gpt", "value": "Positioned to the left is green lawn at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/81180badb831cd6f.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.937, 0.908) positioned after point (0.904, 0.484)?" }, { "from": "gpt", "value": "No, it is in front of (0.904, 0.484)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/56ef014a3e61349b.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery driver who needs to park your 5.5 meter long truck near the yellow matte sign at center and the metallic silver sign at upper center. Can you park your truck between them without overlapping either sign?" }, { "from": "gpt", "value": "The distance between the yellow matte sign at center and the metallic silver sign at upper center is 17.61 meters, which is greater than the truck length of 5.5 meters. Therefore, the truck can be parked between them without overlapping either sign." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/186ac589d2078a10.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of smooth dark water at lower left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.124, 0.805)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c76bc9c288112535.jpg", "conversations": [ { "from": "human", "value": "\nIs black leather jacket at right bigger than dark blue shirt at left?" }, { "from": "gpt", "value": "Yes, black leather jacket at right is bigger than dark blue shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92dd1dd05d435333.jpg", "conversations": [ { "from": "human", "value": "\nYou are an aquatic plant enthusiast looking at the setup. You want to check the health of the green leafy plant at center without disturbing the smooth skin hand at right. Which object should you move first?" }, { "from": "gpt", "value": "The green leafy plant at center is in front of the smooth skin hand at right, so you should move the green leafy plant at center first to access the hand without causing disturbance." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/76af3972166956da.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, white stone ruins at center or rusty stone pillar at left?" }, { "from": "gpt", "value": "Positioned lower is rusty stone pillar at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b6b27ccbbe701e4.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the orange smooth carrot at lower center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.663, 0.778)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/501c4fdc4adfea78.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.721, 0.589) or point (0.788, 0.048)?" }, { "from": "gpt", "value": "Point (0.721, 0.589) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1dfc22cb773f73bf.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if smooth gray suit at left is positioned above shiny metallic shirt at center?" }, { "from": "gpt", "value": "Yes, smooth gray suit at left is above shiny metallic shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed2eb25d467cbba4.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between matte black guitar at left and camera." }, { "from": "gpt", "value": "The distance of matte black guitar at left from camera is 6.93 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bfd71004109d0a66.jpg", "conversations": [ { "from": "human", "value": "\nIs green translucent water at lower left in front of brown cotton shirt at center?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7374aae50a93cd9e.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between green leafy shrub at center and camera." }, { "from": "gpt", "value": "They are 47.44 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a821f011a04f15f.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the light brown wood post at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.465, 0.545)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ce5ceaed6363e0e.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow waterproof jacket at right below yellow matte raincoat at center?" }, { "from": "gpt", "value": "Indeed, yellow waterproof jacket at right is positioned under yellow matte raincoat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6aace53a02255e7.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of green grassy at center in the image." }, { "from": "gpt", "value": "[(0.564, 0.772)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/99c8e32bfa50dfc0.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from point (0.673, 0.758) to camera." }, { "from": "gpt", "value": "They are 3.23 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8cea5f0be180dd91.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the sidewalk in the urban street scene and want to walk from the point at coordinates point (0.954, 0.713) to the point at coordinates point (0.442, 0.744). Which direction should you move to get closer to your destination?" }, { "from": "gpt", "value": "You should move forward because point (0.954, 0.713) is further to the viewer than point (0.442, 0.744), so moving forward will bring you closer to the destination point (0.442, 0.744)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/50d66c5a90b8489f.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to smooth water at center? Please provide its 2D coordinates.Where can I find smooth water at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.483, 0.694)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/81e32e4b93392b09.jpg", "conversations": [ { "from": "human", "value": "\nWhere is wooden canoe at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.612, 0.713)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ed7653dc4b2a1ae.jpg", "conversations": [ { "from": "human", "value": "\nIs matte khaki pants at center to the left of green matte shirt at center from the viewer's perspective?" }, { "from": "gpt", "value": "No, matte khaki pants at center is not to the left of green matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7d9d6c05d074bd66.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a green concrete river at lower right. Pinpoint a point to the green concrete river at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.894, 0.633)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a54401ad6915e2d1.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the green painted wood bench at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.803, 0.806)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/64f6d0a5053ab018.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.348, 0.531) or point (0.679, 0.691)?" }, { "from": "gpt", "value": "The point (0.679, 0.691) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00354cb2cbee36ac.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a shot of the pink quilted jacket at upper right without including the gray brick pavement at lower left in the frame. Based on their positions, is this possible?" }, { "from": "gpt", "value": "The pink quilted jacket at upper right is positioned over the gray brick pavement at lower left, so it is not possible to capture the jacket without including the pavement in the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/396e72c1924838ea.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing on the road and want to capture both the silver metallic truck at center and the white cotton tank top at center in the same frame. Which object should you focus on first to ensure both are in the frame?" }, { "from": "gpt", "value": "The silver metallic truck at center is below the white cotton tank top at center, so you should focus on the white cotton tank top at center first to ensure both are in the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d9618baf1cfe67e.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.750, 0.698) lie in front of point (0.935, 0.648)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4420c762bca551b8.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between yellow leaves at upper left and camera." }, { "from": "gpt", "value": "yellow leaves at upper left is 46.53 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7771fb447553205a.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.025, 0.273) behind point (0.688, 0.269)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/849eff99dc3b078f.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of brown sandy beach at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.498, 0.753)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/538b589e81fd3700.jpg", "conversations": [ { "from": "human", "value": "\nPoint to black plastic sign at center.Point to the black plastic sign at center in the image." }, { "from": "gpt", "value": "[(0.408, 0.591)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/27baabcfb5607ddd.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.513, 0.723) or point (0.027, 0.716)?" }, { "from": "gpt", "value": "Positioned in front is point (0.027, 0.716)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d13e20136a09cd8.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in a fast food restaurant and see the three children. There is a point marked at coordinates (0.713, 0.902). How far is that point from you?" }, { "from": "gpt", "value": "The point at coordinates (0.713, 0.902) is 1.07 meters away from the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fa90c0a4c9d13db3.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the neon white laptop at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.577, 0.463)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7de215f9d99ed30f.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any wooden altar at center in the image." }, { "from": "gpt", "value": "[(0.634, 0.595)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/99929dd59ce106ce.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point labeled point (0.575, 0.530) in the image. How far are you from the camera?" }, { "from": "gpt", "value": "The point labeled point (0.575, 0.530) is 1.79 meters away from the camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3af0daaeb21341d4.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.570, 0.044) positioned in front of point (0.647, 0.853)?" }, { "from": "gpt", "value": "No, (0.570, 0.044) is behind (0.647, 0.853)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f7d8c29d54522bc.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of green leafy tree at upper left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.292, 0.416)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec4429ced2e9c46d.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.515, 0.714)?" }, { "from": "gpt", "value": "mossy rock at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/179c5bb3691e7917.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from orange cotton shirt at center to camera." }, { "from": "gpt", "value": "orange cotton shirt at center and camera are 43.03 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08e87ee93d111bd8.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, blue cotton shirt at center or orange cotton shirt at lower left, stands taller?" }, { "from": "gpt", "value": "Standing taller between the two is blue cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd1a452f18ada23e.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the smooth orange juice at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.254, 0.217)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bbe3a4a2a4ff8025.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if soft plush baby at center is positioned to the right of velvety plush toy at upper right?" }, { "from": "gpt", "value": "In fact, soft plush baby at center is to the left of velvety plush toy at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c32b2e5391a105c5.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte wood guitar at left is positioned to the left of brown smooth dog at lower center?" }, { "from": "gpt", "value": "Correct, you'll find matte wood guitar at left to the left of brown smooth dog at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b7781ca26113728.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the green grassy hillside at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.455, 0.352)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba3fe489209b6569.jpg", "conversations": [ { "from": "human", "value": "\nLocate silhouette tree at upper right in the image." }, { "from": "gpt", "value": "[(0.741, 0.838)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c448a9187b510b1.jpg", "conversations": [ { "from": "human", "value": "\nYou are an astronomer observing the sky and notice the cloudy white at lower center and the black matte tree at lower right. Which object is positioned higher in the sky relative to the other?" }, { "from": "gpt", "value": "The cloudy white at lower center is located above the black matte tree at lower right, meaning it is positioned higher in the sky." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd04666ebddd6f9f.jpg", "conversations": [ { "from": "human", "value": "\nWhat is at (0.545, 0.709)?" }, { "from": "gpt", "value": "striped shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6415ed6e6e9341a6.jpg", "conversations": [ { "from": "human", "value": "\nYou are an outdoor photographer planning to capture a wide landscape shot. You have a camera with a 35mm lens that can capture a maximum width of 50 meters. The smooth gray mountain at center and the green matte tree at center are both in your frame. Based on their widths, will the mountain and tree fit within the lens width capacity?" }, { "from": "gpt", "value": "The smooth gray mountain at center is wider than the green matte tree at center. Since the mountain is wider, and the total combined width of both objects would exceed the 50 meters capacity of the 35mm lens, they might not fit within the lens width capacity. However, if the mountain alone is under 50 meters in width, it could fit. The exact width of each object isnecessary to determine this precisely." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d2df89c27e531b11.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a photo of the shiny black car at center and the matte black top at center. Since both are black, you want to ensure you can distinguish them in your photo. Which object should you focus on to make sure it stands out more due to its size?" }, { "from": "gpt", "value": "The shiny black car at center is bigger than the matte black top at center, so focusing on the shiny black car at center will make it stand out more due to its larger size." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c7878488b9a352e.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on a balcony and want to measure the distance from where you are to the concrete at lower left. What is the distance in meters?" }, { "from": "gpt", "value": "The distance between the concrete at lower left and the camera is 23.97 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/56d46c8b7f1b9eb5.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the Rainbow Runway 2010 fashion show. You need to capture a photo of the dark hair at lower right and the black silky dress at center. Which object will appear larger in the photo?" }, { "from": "gpt", "value": "The dark hair at lower right is smaller than the black silky dress at center, so the black silky dress at center will appear larger in the photo." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cbc90d672efad0b7.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the left, red velvet curtain at upper center or matte black suit at center?" }, { "from": "gpt", "value": "Positioned to the left is red velvet curtain at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/51a07cc1c18c7615.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the matte pink skirt at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.267, 0.453)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8cd560590abe1544.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the green leafy tree at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.551, 0.123)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02997bb046e76f53.jpg", "conversations": [ { "from": "human", "value": "\nLocate the brown stone fountain at center in the image." }, { "from": "gpt", "value": "[(0.855, 0.750)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df2a3d73603a9a6f.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and want to reach the point marked at coordinates (0.209, 0.884). Considering the paved area in the foreground, how far do you need to walk to get there?" }, { "from": "gpt", "value": "The point at coordinates (0.209, 0.884) is 101.29 feet away from the camera, so you need to walk 101.29 feet to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/21418bace9cbd398.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.458, 0.220) more distant than point (0.731, 0.491)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/428f760f2a53e4a4.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of smooth beige rock at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.190, 0.273)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7483c6ee06720a26.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.618, 0.611) or point (0.718, 0.611)?" }, { "from": "gpt", "value": "Point (0.618, 0.611)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/efe9046fb15907e5.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown scaly lizard at center have a lesser height compared to smooth brown hand at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/35098b82b09d24ad.jpg", "conversations": [ { "from": "human", "value": "\nHow far is point (0.481, 0.114) from the camera?" }, { "from": "gpt", "value": "A distance of 6.18 meters exists between point (0.481, 0.114) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4d72c5ff653b0664.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the clear plastic screen door at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.503, 0.152)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70e54b7ff4f9019f.jpg", "conversations": [ { "from": "human", "value": "\nIs metallic blue pole at center bigger than white snow pants at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3618a4f6400da1ee.jpg", "conversations": [ { "from": "human", "value": "\nWhere is matte cardboard poster at left located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.165, 0.566)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34659934300136e5.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the center of the rectangular table in the meeting room. You want to place a new item at the point with coordinates point (0.072, 0.708). Where exactly on the table should you place it?" }, { "from": "gpt", "value": "The point (0.072, 0.708) is on the silver metallic laptop at left, so you should place the new item on top of the silver metallic laptop at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/98b3e20c2e4899a4.jpg", "conversations": [ { "from": "human", "value": "\nHow much distance is there between reflective yellow vest at center and orange fabric at left?" }, { "from": "gpt", "value": "A distance of 13.51 meters exists between reflective yellow vest at center and orange fabric at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4835172bd29a3da6.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.501, 0.491) come in front of point (0.727, 0.409)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/76a5549ad7d73a4c.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the room where the bulldog puppy is sitting. You want to place a small treat exactly at the point labeled as point (0.919, 0.352). If you are currently 1.62 meters away from that point, how far do you need to move forward to reach it?" }, { "from": "gpt", "value": "Since the point (0.919, 0.352) is 1.62 meters away from you, you need to move forward exactly 1.62 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5f2eca9a895d4570.jpg", "conversations": [ { "from": "human", "value": "\nHow far is dried mud tree at center from camera?" }, { "from": "gpt", "value": "dried mud tree at center and camera are 3.12 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05af3097cdba0cc2.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the blue uniform at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.615, 0.589)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77a42219d0975f76.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of blue water at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.457, 0.681)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb77178ce7b034a4.jpg", "conversations": [ { "from": "human", "value": "\nIs orange cloth at center below matte blue shirt at upper left?" }, { "from": "gpt", "value": "Indeed, orange cloth at center is positioned under matte blue shirt at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/275fdbf5c8fc268b.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the black wood cross at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.283, 0.514)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/775652f14ed6fa58.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy hill at center appear on the right side of red fabric jacket at lower right?" }, { "from": "gpt", "value": "Yes, green leafy hill at center is to the right of red fabric jacket at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e95bffc7159678c.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer adjusting the camera focus. The scene has a child in a striped sweater over a red shirt and an adult in a red jacket. Where is the matte red shirt at center located in relation to the point at coordinates (0.719, 0.623)?" }, { "from": "gpt", "value": "The matte red shirt at center is located exactly at the point with coordinates (0.719, 0.623)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d5e10e02d4639c40.jpg", "conversations": [ { "from": "human", "value": "\nIs blue plaid shorts at upper right positioned in front of yellow matte shorts at center?" }, { "from": "gpt", "value": "Yes, blue plaid shorts at upper right is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f2ea5a60651a9d4.jpg", "conversations": [ { "from": "human", "value": "\nHow far is white glossy building at center from camera?" }, { "from": "gpt", "value": "They are 69.81 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85a0d4ea3aa41072.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the smooth concrete ledge at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.593, 0.877)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/559c9cc001ddd87e.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a group photo of the black fabric suit at center and the brown leather jacket at upper right. Based on their positions, which one is more likely to be in the background?" }, { "from": "gpt", "value": "The brown leather jacket at upper right is more likely to be in the background because it is positioned higher up, which typically corresponds to a farther position in such settings." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2931b95f4566ff9b.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of light brown checkered shirt at right?" }, { "from": "gpt", "value": "2.59 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8487d3bdfd446648.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of blue cotton shirt at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.497, 0.464)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60598449fd2a08ad.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the left, white matte shirt at center or white shirt at center?" }, { "from": "gpt", "value": "From the viewer's perspective, white matte shirt at center appears more on the left side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/76b5092c6a1adb90.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.114, 0.727)?" }, { "from": "gpt", "value": "wooden desk at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/63de6561a9efe53d.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of white fluffy cloud at upper center in the image." }, { "from": "gpt", "value": "[(0.555, 0.470)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a98e3a69f7bbaae0.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is glossy red sedan at center from camera?" }, { "from": "gpt", "value": "glossy red sedan at center is 68.76 feet away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d5c5c0dda2eff51c.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the dull brown hillside at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.608, 0.303)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d32b4de23c47a59.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the matte gray rock at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.440, 0.378)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92ef2dde2e8f2dfd.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker who has just found an owl sculpture in the forest. You want to place a small gift exactly halfway between the brown rough wood log at lower right and the brown textured owl at center. How far should you walk from the owl sculpture to reach the halfway point?" }, { "from": "gpt", "value": "The brown rough wood log at lower right is 5.89 feet away from the brown textured owl at center. To find the halfway point, divide the distance by 2, which is 2.945 feet. Walk approximately 2.95 feet away from the owl sculpture towards the brown rough wood log at lower right to place the gift halfway between them." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/863ee8e1578f3bc0.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black suit at center is shorter than black woolen sweater at center?" }, { "from": "gpt", "value": "No, black suit at center is not shorter than black woolen sweater at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/517ffbb551a4e0ed.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the dark gray shirt at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.495, 0.567)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/56f139d8a8331c35.jpg", "conversations": [ { "from": "human", "value": "\nLocate matte silver monitor at left in the image." }, { "from": "gpt", "value": "[(0.265, 0.270)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0aeb370d71b98e74.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between yellow matte/tinted glass ferry at center and camera?" }, { "from": "gpt", "value": "yellow matte/tinted glass ferry at center and camera are 57.84 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/694301f91ceb5b2b.jpg", "conversations": [ { "from": "human", "value": "\nIs white marble statue at center taller than matte white statue at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b8366b4853b9f20.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green translucent water at center is positioned to the left of purple fabric boat at center?" }, { "from": "gpt", "value": "Yes, green translucent water at center is to the left of purple fabric boat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a585b3e966db7984.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the matte black suit at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.724, 0.542)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc7ec3570c941040.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.291, 0.350) or (0.722, 0.747)?" }, { "from": "gpt", "value": "The point (0.722, 0.747) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cdc2cd2d3256ca6d.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at a formal event. You need to capture a closeup shot of both the satin black dress at center and the bow tie at center in the same frame. The camera you are using has a minimum focus distance of 24 inches. Can you position yourself close enough to both objects to get them both in focus?" }, { "from": "gpt", "value": "The satin black dress at center and bow tie at center are 26.37 inches apart. Since the minimum focus distance is 24 inches, the photographer can position themselves within 24 inches from both objects to capture them in focus as the distance between them is greater than the minimum focus requirement." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6824907bb4c15052.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a closeup of the blue knitted scarf at center. According to the coordinates provided, where should you focus your camera lens?" }, { "from": "gpt", "value": "The blue knitted scarf at center is located at coordinates point (0.746, 0.627), so you should focus your camera lens there." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/035c7b162eb36689.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer adjusting your camera settings to focus on the white tulle dress at center and the dark blue leather jacket at lower right. Which object should you focus on first to ensure both are in sharp focus?" }, { "from": "gpt", "value": "The white tulle dress at center is closer to the viewer than the dark blue leather jacket at lower right, so focus on the white tulle dress at center first to ensure both are in sharp focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e50c03f4e8298894.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, gray woolen sweater at right or matte blue tie at left?" }, { "from": "gpt", "value": "gray woolen sweater at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f0ec335d18c06e2a.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the white matte sweater at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.553, 0.322)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d417d2630b4e407e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray matte whale at lower center is positioned to the right of green/yellow vest at upper center?" }, { "from": "gpt", "value": "In fact, gray matte whale at lower center is to the left of green/yellow vest at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9869f7beeb80d936.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black backpack at center come behind dark blue jacket at center?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34eb4032eaf03672.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between point (0.202, 0.731) and camera." }, { "from": "gpt", "value": "Point (0.202, 0.731) is 2.07 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0efe488763264c47.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person who needs to reach the Honda sign on the building. You have a yellow matte bicycle at left and a matte gray shirt at left. Which object is closer to you if you are standing at the Honda sign?" }, { "from": "gpt", "value": "The yellow matte bicycle at left and matte gray shirt at left are 62.66 centimeters apart. Since you are standing at the Honda sign, the distance to both objects cannot be determined without additional information about their positions relative to the sign." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/999a2e4fe482a4d7.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.364, 0.661) and point (0.461, 0.411), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.461, 0.411) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e69a74d3a0581e6.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.695, 0.395)?" }, { "from": "gpt", "value": "curly red hair at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2360f7a30fcc7d70.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer holding a camera. You want to capture a closeup of the green glossy leaf at center. The camera is currently 3.70 feet away from the leaf. To get a better focus, you need to adjust the distance so that the leaf fills the frame without moving the leaf. Should you move closer or farther away?" }, { "from": "gpt", "value": "To get a better focus and fill the frame with the green glossy leaf at center, you should move closer because the camera is currently 3.70 feet away, which may be too far for a closeup. Moving closer would allow the leaf to take up more of the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ea69433cd4029ee.jpg", "conversations": [ { "from": "human", "value": "\nDoes pink matte shirt at right have a greater height compared to white matte bag at center?" }, { "from": "gpt", "value": "Correct, pink matte shirt at right is much taller as white matte bag at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8669284d7418c0eb.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the center of the playground and looking towards the multi level structure. There is a point marked at coordinates (0.807, 0.672). Which object does this point correspond to?" }, { "from": "gpt", "value": "The point corresponds to the beige plastic slide at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb37ad928c589283.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and want to reach point (0.911, 0.811). Is the distance more than 30 inches?" }, { "from": "gpt", "value": "The distance between the camera and point (0.911, 0.811) is 30.76 inches, so yes, it is more than 30 inches." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8219236525579fb.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person who needs to enter the Barnes and Noble Bookstore. You have a tall package that is 2 meters in height. You are standing in the parking lot and see the silver metallic suv at lower left and the matte gray sedan at lower left. Which vehicle can you park closer to the entrance without worrying about the height restriction of the bookstore entrance?" }, { "from": "gpt", "value": "The silver metallic suv at lower left has a greater height compared to matte gray sedan at lower left. Since the package is 2 meters tall, parking closer to the entrance would be safer near the matte gray sedan at lower left, as the lower vehicle height reduces the risk of hitting the entrance with the tall package." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb88d1cebead1fc7.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of green plastic house at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.565, 0.645)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/badf0d36388c2cb2.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the wooden ladder at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.596, 0.408)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60b94446993dba0a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if smooth skin man at center is smaller than brown skin boy at lower left?" }, { "from": "gpt", "value": "No, smooth skin man at center is not smaller than brown skin boy at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b27603532dcddf1b.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.892, 0.819) or point (0.929, 0.748)?" }, { "from": "gpt", "value": "Point (0.929, 0.748)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dbcee95500a095dd.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte canvas tarp at center is positioned to the left of smooth white shirt at center?" }, { "from": "gpt", "value": "Yes, matte canvas tarp at center is to the left of smooth white shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ddf56bc149c00fc6.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point labeled as point (0.502, 0.758) in the image. Based on the scene description, what is the immediate terrain you are standing on?" }, { "from": "gpt", "value": "The point (0.502, 0.758) corresponds to the green grassy field at center, so you are standing on the green grassy field at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b146e0ff336a611.jpg", "conversations": [ { "from": "human", "value": "\nDoes white pebbles at center come in front of white plastic beach chair at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05c7be3caa4ab7b5.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, brown wooden deck at center or gray scaly crocodile at lower right?" }, { "from": "gpt", "value": "With less height is gray scaly crocodile at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a0f85cf84c4e2f7f.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, green matte train car at center or rustic wood grain train car at right?" }, { "from": "gpt", "value": "green matte train car at center is more to the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ac92d4b22aaad00.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.090, 0.152) or point (0.056, 0.936)?" }, { "from": "gpt", "value": "Positioned behind is point (0.090, 0.152)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9e7ff34bea73d64.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.788, 0.227) positioned after point (0.209, 0.192)?" }, { "from": "gpt", "value": "No, it is in front of (0.209, 0.192)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ddcd5eb7a131916.jpg", "conversations": [ { "from": "human", "value": "\nYou are a wildlife photographer observing the penguins. You need to capture a photo where both the black matte penguin at right and the black matte penguin at lower right are visible. Based on their positions, which penguin should you focus on first to ensure both are in frame?" }, { "from": "gpt", "value": "The black matte penguin at right is located above the black matte penguin at lower right, so focusing on the black matte penguin at right first will allow you to adjust the camera angle downward to include the black matte penguin at lower right in the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2cf6fb277f772748.jpg", "conversations": [ { "from": "human", "value": "\nBetween leather pants at center and leather jacket at center, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "From the viewer's perspective, leather jacket at center appears more on the right side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/772917833d7ded3e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.135, 0.739)?" }, { "from": "gpt", "value": "neon yellow mesh bag at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ae72393544ee2ee.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black suit at center appear on the left side of yellow satin tie at center?" }, { "from": "gpt", "value": "Yes, matte black suit at center is to the left of yellow satin tie at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c5867447d9a1bfde.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.653, 0.744) closer to camera compared to point (0.161, 0.580)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.161, 0.580)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4261e85a9c80f25a.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth skin newborn at center behind smooth skin hand at center?" }, { "from": "gpt", "value": "No, smooth skin newborn at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d51d23d81a3ede34.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, metallic structure at center or metallic silver car at lower left?" }, { "from": "gpt", "value": "metallic silver car at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/049f9c5f957c3caa.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing in the room and want to take a photo of the white fleece jacket at center. How far should you move forward or backward to ensure the jacket fills the camera frame properly?" }, { "from": "gpt", "value": "The white fleece jacket at center is 2.33 meters away from the viewer. To fill the camera frame properly, you should adjust your distance to approximately 2 meters, as most cameras require the subject to be within 2 meters for optimal framing." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cfe16850636914a5.jpg", "conversations": [ { "from": "human", "value": "\nIs rusty wood table at center shorter than floral fabric shirt at center?" }, { "from": "gpt", "value": "Yes, rusty wood table at center is shorter than floral fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb577ca837a51777.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.799, 0.766) and point (0.579, 0.733), which one is positioned behind?" }, { "from": "gpt", "value": "Positioned behind is point (0.579, 0.733)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b2909013ffe6564a.jpg", "conversations": [ { "from": "human", "value": "\nIs pink down jacket at center further to camera compared to black fuzzy glove at center?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/74ec6f2109bcbfbf.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of blue fabric life vest at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.610, 0.631)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5fd83f2b06eafbc.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.408, 0.797) or point (0.399, 0.520)?" }, { "from": "gpt", "value": "Point (0.399, 0.520)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7400295de5a2bb4.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.769, 0.803) or (0.033, 0.630)?" }, { "from": "gpt", "value": "The point (0.769, 0.803) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4cf74ad9f07b5a25.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the gold shiny hat at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.553, 0.423)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1e89a8144298398.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between matte white crowd at center and camera?" }, { "from": "gpt", "value": "A distance of 13.27 meters exists between matte white crowd at center and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3de8e0854ebfbf11.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from dark blue t-shirt at center to camera." }, { "from": "gpt", "value": "They are 93.76 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a82ae02c179fa2e.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.727, 0.775) lie in front of point (0.381, 0.861)?" }, { "from": "gpt", "value": "No, it is behind (0.381, 0.861)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ad78333ec5c9510f.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.002, 0.588) and point (0.583, 0.833), which one is positioned behind?" }, { "from": "gpt", "value": "Positioned behind is point (0.583, 0.833)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92af8a81550395c5.jpg", "conversations": [ { "from": "human", "value": "\nHow far apart are white cotton shirt at right and orange fabric at lower center?" }, { "from": "gpt", "value": "They are 4.95 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b6442e439d4fcc30.jpg", "conversations": [ { "from": "human", "value": "\nBased on the scene description, where is the golden stone column at center located in terms of coordinates?" }, { "from": "gpt", "value": "The golden stone column at center is located at coordinates point (0.710, 0.528)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f36e44de01418799.jpg", "conversations": [ { "from": "human", "value": "\nIs matte blue shirt at center taller than black fur-lined coat at center?" }, { "from": "gpt", "value": "Yes, matte blue shirt at center is taller than black fur-lined coat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/30071f91c10122be.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of white matte projection screen at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.573, 0.284)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/28979e27d31f0d63.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the right, pink fabric shirt at upper center or soft plush dinosaur at left?" }, { "from": "gpt", "value": "pink fabric shirt at upper center is more to the right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/490430d300bf2567.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the balcony and want to place a new plant pot between the two points labeled point (0.030, 0.734) and point (0.046, 0.566). Which point should the pot be closer to in order to be nearer to you?" }, { "from": "gpt", "value": "The pot should be closer to point (0.030, 0.734) because it is closer to the viewer than point (0.046, 0.566)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86967e682fc15c94.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.746, 0.552) or (0.076, 0.569)?" }, { "from": "gpt", "value": "The point (0.746, 0.552) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85db6990b4916947.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the cloudy white at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.449, 0.223)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58cc6887adf67ccf.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark gray pants at right appear on the left side of dark gray fabric pants at right?" }, { "from": "gpt", "value": "In fact, dark gray pants at right is to the right of dark gray fabric pants at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b040aae491d6b73e.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of neon green running shoes at center less distant than that of lavender soft fabric onesie at center?" }, { "from": "gpt", "value": "Yes, it is in front of lavender soft fabric onesie at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5af06bbe833cc8eb.jpg", "conversations": [ { "from": "human", "value": "\nYou are an event planner organizing a photo shoot in the arena. You need to position a camera to capture both the patterned fabric jacket at center and the light beige wool coat at center. Based on their positions, which one should be placed closer to the camera to ensure both are in focus?" }, { "from": "gpt", "value": "The patterned fabric jacket at center is located below the light beige wool coat at center. To ensure both are in focus, the camera should be positioned so that the light beige wool coat at center is closer to the camera since it is above the jacket." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/52b5428326adf564.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of the beige concrete villa at center and want to walk towards the green grass at lower left. In which direction should you go?" }, { "from": "gpt", "value": "You should go to the left because the beige concrete villa at center is to the right of green grass at lower left, so moving left from the villa will lead you toward the grass." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9ad8d006c537d0a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown suede blazer at center is wider than black satin dress at lower left?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/94eeb98e22a625d6.jpg", "conversations": [ { "from": "human", "value": "\nYou are a passenger on the vintage tram and want to sit as close as possible to the blue fleece jacket at center. Where should you sit?" }, { "from": "gpt", "value": "The blue fleece jacket at center is located at point 0.482 on the y axis, so you should sit in the seat closest to that coordinate to be as close as possible." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/216cd2abb9e90355.jpg", "conversations": [ { "from": "human", "value": "\nHow close is point (0.803, 0.580) from camera?" }, { "from": "gpt", "value": "Point (0.803, 0.580) is 50.26 centimeters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/657298ea21cec028.jpg", "conversations": [ { "from": "human", "value": "\nYou are a maintenance worker needing to walk from the fuel truck to the blue metallic airplane at center. According to the scene, which direction should you head relative to the smooth concrete tarmac at center?" }, { "from": "gpt", "value": "The smooth concrete tarmac at center is to the right of the blue metallic airplane at center, so to reach the airplane, you should head to the left of the smooth concrete tarmac at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7d2e903cfa701896.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker who wants to pick up the light brown sandal at center. How far do you need to walk to reach it?" }, { "from": "gpt", "value": "The light brown sandal at center is 47.14 meters away from the viewer, so you need to walk 47.14 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7cd8aca02161f9ea.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the child in the image. You need to adjust your camera settings to focus on both the smooth skin face at center and the brown glossy eye at upper left. Considering their sizes, which object should you prioritize focusing on first?" }, { "from": "gpt", "value": "The smooth skin face at center is much taller than the brown glossy eye at upper left, so you should prioritize focusing on the smooth skin face at center first because it is larger and more prominent in the image." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6dbcbef8acdc32a9.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of matte stone clock tower at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.455, 0.395)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a7849e51df4b3b6.jpg", "conversations": [ { "from": "human", "value": "\nCould you measure the distance between black fabric bag at center and black plastic goggles at center?" }, { "from": "gpt", "value": "22.10 centimeters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85f910358016e39b.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the edge of the field and see the green grass at center and the wire at bottom. Which object is closer to your right side?" }, { "from": "gpt", "value": "The green grass at center is to the right of the wire at bottom, so the green grass at center is closer to your right side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aea809129a4969c5.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.937, 0.923) or point (0.649, 0.977)?" }, { "from": "gpt", "value": "Point (0.937, 0.923)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/917899e3aee4c851.jpg", "conversations": [ { "from": "human", "value": "\nBetween clear water at center and gray metallic ship at center, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "gray metallic ship at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0cce5203d083eeef.jpg", "conversations": [ { "from": "human", "value": "\nBetween brown shaggy dog at center and fuzzy beige dog at center, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "brown shaggy dog at center is more to the right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e26fabc320c4b5da.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the park scene and want to take a photo of both the point at (0.977, 0.956) and the point at (0.028, 0.656). Which point should you focus on first to ensure both are in the same frame?" }, { "from": "gpt", "value": "You should focus on the point at (0.977, 0.956) first since it is closer to the camera than the point at (0.028, 0.656). This will help ensure both points are within the frame by starting with the closer one." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/10d38c4ad54f7a87.jpg", "conversations": [ { "from": "human", "value": "\nYou are a museum curator examining the granite statue at center and the granite statue head at center. Which object is positioned higher in the image?" }, { "from": "gpt", "value": "The granite statue at center is positioned higher than the granite statue head at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/407652753dcfa604.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.485, 0.817) and camera?" }, { "from": "gpt", "value": "Point (0.485, 0.817) and camera are 46.75 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8de5a9de5de6da3a.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the black plastic keyboard at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.341, 0.497)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9aff21d804ba7019.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the child in the cornfield. Since the brown dry corn at center and the pink fabric dress at center are both at the center, which one is closer to the camera?" }, { "from": "gpt", "value": "The brown dry corn at center is above the pink fabric dress at center, so the corn is closer to the camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e42194ac188ad03d.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.473, 0.570) less distant than point (0.335, 0.164)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/677b534b7add077d.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the white soft fur puppy at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.523, 0.591)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/beb4995560188a5f.jpg", "conversations": [ { "from": "human", "value": "\nBased on the coordinates provided, which object is located at point (0.929, 0.181)?" }, { "from": "gpt", "value": "The brown leather jacket at upper center is located at point (0.929, 0.181)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a4aada22e3f2008.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.632, 0.662) or point (0.851, 0.758)?" }, { "from": "gpt", "value": "Point (0.632, 0.662) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b586d7bea7eb018.jpg", "conversations": [ { "from": "human", "value": "\nPoint to black matte pole at center.Point to the black matte pole at center in the image." }, { "from": "gpt", "value": "[(0.803, 0.586)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/518ba176acfb68f6.jpg", "conversations": [ { "from": "human", "value": "\nIs green smooth leaf at lower left taller than shiny blue butterfly at center?" }, { "from": "gpt", "value": "No, green smooth leaf at lower left is not taller than shiny blue butterfly at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/828c496dcdfe1cd4.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between matte black shirt at center and camera?" }, { "from": "gpt", "value": "They are 35.66 inches apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/633ef81db1359bb4.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.830, 0.164) lie behind point (0.143, 0.216)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/daecd28ad4791320.jpg", "conversations": [ { "from": "human", "value": "\nDoes silky maroon shirt at center come in front of black silk scarf at left?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9e961a0b9dae1bc6.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between point (0.868, 0.631) and camera?" }, { "from": "gpt", "value": "They are 43.92 centimeters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5606d3af154a38a3.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker who wants to cross the river using the smooth pebbles at center and the beige cotton shirt at center. Which object is larger in size and can provide a more stable footing for crossing?" }, { "from": "gpt", "value": "The smooth pebbles at center are larger in size than the beige cotton shirt at center, so they can provide a more stable footing for crossing." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e88bc772f4e6d1b.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, black pinstripe suit at right or wooden table at center?" }, { "from": "gpt", "value": "Positioned higher is black pinstripe suit at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5adf9821963beb29.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.627, 0.433) and point (0.577, 0.519), which one is positioned behind?" }, { "from": "gpt", "value": "Point (0.577, 0.519)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ef4a7c17949d4cd.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.781, 0.541) closer to viewer compared to point (0.894, 0.608)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.894, 0.608)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/076977a903db8ca8.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of matte blue shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.489, 0.617)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e52ba7a5d398a98.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.454, 0.798) lie in front of point (0.497, 0.377)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d1ec2bcb76a9d80.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.497, 0.047) and point (0.386, 0.520), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.386, 0.520)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b69294ab8a72f74.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.479, 0.463) or point (0.456, 0.492)?" }, { "from": "gpt", "value": "The point (0.456, 0.492) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7d84a8bdc3736f9.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.199, 0.562)?" }, { "from": "gpt", "value": "matte black blazer at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fab2e6cae6afcb9b.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from green leafy hill at center to camera." }, { "from": "gpt", "value": "They are 173.27 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fce350186446fef0.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of rusty metallic dinosaur at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.062, 0.216)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4c23c859c898dda0.jpg", "conversations": [ { "from": "human", "value": "\nYou are a guest at this gathering and want to place a small vase between the pink fabric scarf at right and the white fluffy bread at lower center. Considering their sizes, which object should the vase be closer to?" }, { "from": "gpt", "value": "The pink fabric scarf at right is taller than the white fluffy bread at lower center. Therefore, the vase should be placed closer to the white fluffy bread at lower center to balance the height differences between the two objects." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/432b00db2395b8d2.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.259, 0.814)?" }, { "from": "gpt", "value": "rusty wire mesh net at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3ae6d5c6836372c4.jpg", "conversations": [ { "from": "human", "value": "\nHow close is point (0.986, 0.820) from camera?" }, { "from": "gpt", "value": "Point (0.986, 0.820) is 15.82 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef1e3641c0d83af7.jpg", "conversations": [ { "from": "human", "value": "\nDoes white fabric canopy at upper center appear on the right side of dark blue coat at center?" }, { "from": "gpt", "value": "Indeed, white fabric canopy at upper center is positioned on the right side of dark blue coat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf15be3215ecf490.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark wood/texture rocking horse at center is wider than wooden drawer at upper right?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2975e310216c39f6.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the matte black wetsuit at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.465, 0.533)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/69b8dc8bafb3549c.jpg", "conversations": [ { "from": "human", "value": "\nBetween black matte shirt at left and white cotton shirt at center, which one is positioned higher?" }, { "from": "gpt", "value": "Positioned higher is black matte shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f43eeb9024d1a61.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between brown stone tower at center and camera?" }, { "from": "gpt", "value": "brown stone tower at center and camera are 51.52 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/270ecf3474ee14c5.jpg", "conversations": [ { "from": "human", "value": "\nYou are an ornithologist observing the winter landscape and want to note the positions of two features. Which object is positioned higher in the image, the green matte tree at upper left or the bare branches at upper center?" }, { "from": "gpt", "value": "The green matte tree at upper left is located above the bare branches at upper center, so it is positioned higher in the image." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/009283c718d028f5.jpg", "conversations": [ { "from": "human", "value": "\nLocate blue water at right in the image." }, { "from": "gpt", "value": "[(0.977, 0.473)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3fde35d77dd551a4.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the green leafy plant at right? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.861, 0.364)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5555ea7e5cba431.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, clear glass window at center or matte glass window at upper center?" }, { "from": "gpt", "value": "Positioned lower is clear glass window at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/84829f4dd752e8fc.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the modern architectural structure and notice two green leafy trees. Which tree, the green leafy tree at center or the green leafy tree at lower left, is positioned higher relative to the building?" }, { "from": "gpt", "value": "The green leafy tree at center is positioned higher relative to the building than the green leafy tree at lower left because it is above it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ceaa00ebc6a2309.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown glossy horse at center appear on the right side of shiny blue leotard at left?" }, { "from": "gpt", "value": "Indeed, brown glossy horse at center is positioned on the right side of shiny blue leotard at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8941dce1f1923871.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.314, 0.366) or (0.204, 0.527)?" }, { "from": "gpt", "value": "Positioned in front is point (0.314, 0.366)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a3e44159a04898a8.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.419, 0.527) closer to viewer compared to point (0.613, 0.550)?" }, { "from": "gpt", "value": "Yes, point (0.419, 0.527) is in front of point (0.613, 0.550)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f2f1cd9fdea0a05.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.865, 0.419) more distant than point (0.188, 0.575)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f3079cf9de25abb.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of black satin blouse at center in the image." }, { "from": "gpt", "value": "[(0.515, 0.659)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5c987559d94f08b.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to white matte car at left? Please provide its 2D coordinates.Where can I find white matte car at left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.086, 0.700)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d08b2b83001ca6a8.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a group photo of the orange matte shirt at center and the matte orange hand at center. The camera you are using has a minimum focusing distance of 16 inches. Can you take a clear photo of both subjects without moving them?" }, { "from": "gpt", "value": "The distance between the orange matte shirt at center and the matte orange hand at center is 16.13 inches. Since the camera requires a minimum focusing distance of 16 inches, the 16.13 inches is just enough to capture both subjects clearly without moving them." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0df85d60e034e5a2.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of green metallic lift truck at lower left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.512, 0.520)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07af3849c9d70dca.jpg", "conversations": [ { "from": "human", "value": "\nLocate blue matte shirt at center in the image." }, { "from": "gpt", "value": "[(0.613, 0.711)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e7302e93d347589a.jpg", "conversations": [ { "from": "human", "value": "\nLocate all gray concrete crate at center in the image." }, { "from": "gpt", "value": "[(0.389, 0.669)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34e6250edc1c8d10.jpg", "conversations": [ { "from": "human", "value": "\nBetween metallic statue at upper center and white glossy boat at center, which one has less height?" }, { "from": "gpt", "value": "white glossy boat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ab468afbe32f273.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of green striped shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.440, 0.486)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/99bff1b4f3638eb2.jpg", "conversations": [ { "from": "human", "value": "\nDoes translucent glass bowl of fruit salad at center have a lesser height compared to silver metallic spoon at center?" }, { "from": "gpt", "value": "Correct, translucent glass bowl of fruit salad at center is not as tall as silver metallic spoon at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b2ce44c8ad639708.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from point (0.388, 0.569) to camera." }, { "from": "gpt", "value": "A distance of 236.69 feet exists between point (0.388, 0.569) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6050aac7f2baddc6.jpg", "conversations": [ { "from": "human", "value": "\nWhat is at (0.254, 0.477)?" }, { "from": "gpt", "value": "transparent glass window at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/102a1f99f91fdcfd.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, olive-green fabric coat at center or blue fuzzy beanie at center?" }, { "from": "gpt", "value": "blue fuzzy beanie at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/574c7783be34af5d.jpg", "conversations": [ { "from": "human", "value": "\nPoint to black plastic chair at upper center.Point to the black plastic chair at upper center in the image." }, { "from": "gpt", "value": "[(0.434, 0.194)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e869d1f8b1efdbf3.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the camera position. You want to take a photo of the white matte jersey at center. How far should you focus your camera lens to capture the jersey clearly?" }, { "from": "gpt", "value": "The white matte jersey at center is 32.99 feet from the camera, so you should focus your camera lens at 32.99 feet to capture it clearly." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0bf8eefd7e2aefc4.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a candid shot of the matte pink pants at center and the matte pink leggings at center on the train station platform. Since both are at the center, which one would you focus on to ensure they are both in the frame without moving the camera? Explain your reasoning based on their spatial relationship." }, { "from": "gpt", "value": "The matte pink pants at center might be wider than the matte pink leggings at center, so focusing on the wider matte pink pants at center would ensure both are in the frame as the leggings are likely narrower and positioned within the same central area." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/32369275f6630b28.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.143, 0.578) or point (0.304, 0.617)?" }, { "from": "gpt", "value": "Point (0.143, 0.578)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de1efba095d2a497.jpg", "conversations": [ { "from": "human", "value": "\nIs matte purple tank top at center wider than matte purple shirt at center?" }, { "from": "gpt", "value": "Yes, matte purple tank top at center is wider than matte purple shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e693d0227779fe5.jpg", "conversations": [ { "from": "human", "value": "\nIs spotted fur dog at lower right above yellow/black life vest at center?" }, { "from": "gpt", "value": "Incorrect, spotted fur dog at lower right is not positioned above yellow/black life vest at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1516b31ba5535a75.jpg", "conversations": [ { "from": "human", "value": "\nYou are a customer in a shop and want to buy the polished gold statue at center. The shopkeeper says that the statue is placed exactly at the center of the display. Is the shopkeeper telling the truth?" }, { "from": "gpt", "value": "The polished gold statue at center is located at point (0.572, 0.505), which is very close to the center coordinates of (0.500, 0.500). Therefore, the shopkeeper is telling the truth." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4d74d539daad7e1a.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the green fleece jacket at upper left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.188, 0.588)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7a6b684276f3cf59.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked as point (0.823, 0.828) in the image, which is 92.30 feet away from you. You want to walk towards the rocky shoreline where the person is standing. How far do you need to walk to reach the shoreline?" }, { "from": "gpt", "value": "The distance of point (0.823, 0.828) from viewer is 92.30 feet, so you need to walk 92.30 feet to reach the shoreline." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7a23a067b3eb8591.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of denim jacket at upper left less distant than that of white matte tablet at center?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1cd672fe781bc060.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden plank hut at center below matte green dress at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ef6ff9a7ced8a8c.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of blue denim jacket at lower left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.071, 0.697)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f0f152a6b4fec188.jpg", "conversations": [ { "from": "human", "value": "\nIs metallic silver frame at upper center thinner than brown wooden pole at center?" }, { "from": "gpt", "value": "Incorrect, metallic silver frame at upper center's width is not less than brown wooden pole at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e2169439a264b837.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from natural wood handrail at center to camera." }, { "from": "gpt", "value": "The distance of natural wood handrail at center from camera is 6.56 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/818c55e29fb99bff.jpg", "conversations": [ { "from": "human", "value": "\nIs gray concrete picnic table at center smaller than green leafy tree at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/22919e6aac209778.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.542, 0.689) positioned after point (0.784, 0.661)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9bf68bf0fb022278.jpg", "conversations": [ { "from": "human", "value": "\nYou are a coach in a gymnasium. You need to retrieve the yellow jacket at right from the white leather fencing suit at center to give it to another athlete. Is the distance between them manageable for you to walk there and back without tiring?" }, { "from": "gpt", "value": "The distance between the white leather fencing suit at center and the yellow jacket at right is 6.27 meters. Walking this distance and back would total 12.54 meters, which is a short distance for a coach to manage without tiring." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44c879c3d707ff8d.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up a tripod to capture the scene. You need to ensure that both the embroidered cotton dress at center and the green matte jacket at right are fully visible in the frame. Given their widths, which object requires a wider angle to accommodate its size?" }, { "from": "gpt", "value": "The embroidered cotton dress at center requires a wider angle because its width surpasses that of the green matte jacket at right, necessitating more space in the frame to fully capture it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ae413ab3ede5a06e.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the green leafy trees at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.503, 0.506)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f8e22780e650882.jpg", "conversations": [ { "from": "human", "value": "\nWhere is dark gray fleece jacket at lower right located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.777, 0.766)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cda6b1725f7f66f1.jpg", "conversations": [ { "from": "human", "value": "\nHow close is dark gray metallic car at center from camera?" }, { "from": "gpt", "value": "dark gray metallic car at center and camera are 43.24 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/53c7fba519c54250.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if carrot puree at center is positioned above shiny red berries at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba08080bf21f6d52.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.027, 0.203) and camera?" }, { "from": "gpt", "value": "Point (0.027, 0.203) is 4.43 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/281d8523a6dbac64.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, matte white shirt at upper center or matte black hand at center?" }, { "from": "gpt", "value": "With less height is matte black hand at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/339fa1f9ea348ae6.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.931, 0.917) come in front of point (0.276, 0.772)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.276, 0.772)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cbb493ea2fd7234c.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of white matte t-shirt at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.296, 0.597)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bcee5630199c88c1.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black matte shorts at center is positioned below shiny black car at center?" }, { "from": "gpt", "value": "Indeed, black matte shorts at center is positioned under shiny black car at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c16eb7bb279a94ed.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any transparent glass table at lower left in the image." }, { "from": "gpt", "value": "[(0.192, 0.603)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/885bd98563820027.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.634, 0.575) more distant than point (0.300, 0.970)?" }, { "from": "gpt", "value": "No, (0.634, 0.575) is in front of (0.300, 0.970)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36c0cb89da6f795e.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of teal matte car at lower right? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.959, 0.963)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fec28fb8ab5f5f30.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the rocky shoreline and want to reach the calm water at the center of the scene. Which object do you need to step over or around first, the transparent water at center or the gray gravel shoreline at center?" }, { "from": "gpt", "value": "You need to step over the gray gravel shoreline at center first because the transparent water at center is closer to the viewer, meaning the gray gravel shoreline is behind it and thus further away from your current position on the shoreline." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/67843aa01c1aac14.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.605, 0.530) lie behind point (0.018, 0.709)?" }, { "from": "gpt", "value": "No, it is in front of (0.018, 0.709)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a87c8a0499ecacbf.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.467, 0.658)?" }, { "from": "gpt", "value": "matte black pen at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fbb673a91f05647a.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of teal dotted fabric dress at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.629, 0.639)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f59a927aef76f19b.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the scene and want to move from the point at coordinates point (0.839, 0.308) to the point at coordinates point (0.430, 0.530). Which direction should you move to get closer to the latter?" }, { "from": "gpt", "value": "To move from point (0.839, 0.308) to point (0.430, 0.530), you should move downward and to the right since point (0.430, 0.530) is closer to the viewer and positioned lower and to the right compared to point (0.839, 0.308)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3bd12dc34067bd40.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer in the conference room. You need to take a photo of the dark gray suit at center and the floral fabric blouse at right. Based on their positions, which one should you focus on first to ensure both are in frame?" }, { "from": "gpt", "value": "The floral fabric blouse at right is located below the dark gray suit at center, so you should focus on the dark gray suit at center first to ensure both are in frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cfc367fbd1242ddf.jpg", "conversations": [ { "from": "human", "value": "\nYou are an avatar in the winter scene and want to give a gift to both the matte black suit at left and the light yellow sweater at center. Since you have limited energy, you want to visit the closer one first. Which avatar should you approach first?" }, { "from": "gpt", "value": "The light yellow sweater at center is closer because the matte black suit at left has a larger size, so you should approach the light yellow sweater at center first." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/43d3d802dd7acfd1.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of black metallic tripod at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.825, 0.745)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d82976cdb7461605.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.926, 0.881) from camera?" }, { "from": "gpt", "value": "Point (0.926, 0.881) is 15.89 feet away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/237193932836bf40.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the pink matte fabric at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.670, 0.467)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd0719041905a489.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.344, 0.756) from camera?" }, { "from": "gpt", "value": "The distance of point (0.344, 0.756) from camera is 2.69 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7a612a50dfd87494.jpg", "conversations": [ { "from": "human", "value": "\nIs dark gray textured shirt at lower left further to the viewer compared to dark blue jeans at lower center?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c80570ebcbc73219.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.540, 0.136)?" }, { "from": "gpt", "value": "dark gray stone dome at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c8991437219a45c.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black shed at center have a lesser height compared to white matte suv at right?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc5f0bad52d4d68d.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of light green cotton tank top at center?" }, { "from": "gpt", "value": "7.00 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0248e01ca87bd60f.jpg", "conversations": [ { "from": "human", "value": "\nWhat is at (0.742, 0.670)?" }, { "from": "gpt", "value": "brown quilted vest at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/67fc1c7c99ad4303.jpg", "conversations": [ { "from": "human", "value": "\nIs black wool suit at center further to camera compared to black fabric uniform at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2aead897ff3646a2.jpg", "conversations": [ { "from": "human", "value": "\nDoes clear water at center have a smaller size compared to striped fabric swimsuit at center?" }, { "from": "gpt", "value": "No, clear water at center is not smaller than striped fabric swimsuit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4213b82d668f366.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in a kitchen and need to reach a point marked at coordinates (0.203, 0.809). How far is this point from your current position?" }, { "from": "gpt", "value": "The point at coordinates (0.203, 0.809) is 4.66 feet away from your current position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ecf3c1ddca92267b.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of snow-covered evergreen at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.555, 0.261)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ffe807a8904ad308.jpg", "conversations": [ { "from": "human", "value": "\nHow close is point (0.621, 0.191) from camera?" }, { "from": "gpt", "value": "12.97 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2182cbede7e2ea54.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark gray pants at center appear on the left side of light brown leather jacket at upper right?" }, { "from": "gpt", "value": "Correct, you'll find dark gray pants at center to the left of light brown leather jacket at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7791149074ecc040.jpg", "conversations": [ { "from": "human", "value": "\nIs fluffy beige puppies at left below gray fluffy puppy at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4da4307b43eba6ef.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of gray checkered suit at lower center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.366, 0.898)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c604aa3e08652007.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked as point (0.587, 0.434) in the image. How far are you from the viewer?" }, { "from": "gpt", "value": "The distance between point (0.587, 0.434) and the viewer is 4.61 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0e972d923f6b4b6.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of frosted white basket at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.569, 0.548)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7411c4fbef121218.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the white cloth at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.740, 0.775)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/034d49b1ce980c26.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person trying to place a rectangular package that measures 15 inches in length on the floor between the brown wooden table at left and the wooden chair at center. Based on the space available, will the package fit without overlapping either the table or the chair?" }, { "from": "gpt", "value": "The distance between the brown wooden table at left and the wooden chair at center is 14.75 inches. Since the package is 15 inches long, it will not fit entirely between them without overlapping either the table or the chair." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1713fb78da810c7.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.192, 0.169)?" }, { "from": "gpt", "value": "white vapor at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c478e597495583bd.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.574, 0.391) or point (0.843, 0.627)?" }, { "from": "gpt", "value": "The point (0.574, 0.391) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c438c0d93c47046.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing in front of the group in the dance studio. You want to take a photo that focuses on the black matte shirt at center and the blue cotton shirt at left. Which of these two shirts is closer to you?" }, { "from": "gpt", "value": "The black matte shirt at center is closer to you because it is further to the viewer than the blue cotton shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4ab85e127c83b168.jpg", "conversations": [ { "from": "human", "value": "\nIs matte red jacket at center positioned before metallic red car at left?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f54c65bcc62772b3.jpg", "conversations": [ { "from": "human", "value": "\nLocate beige fleece jacket at center in the image." }, { "from": "gpt", "value": "[(0.491, 0.605)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab94e5c4300cb78c.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green leafy tree at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.482, 0.219)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e8bb6c5d03929c2.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.107, 0.369) or (0.151, 0.891)?" }, { "from": "gpt", "value": "Positioned behind is point (0.107, 0.369)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4d74ecdf1ff45a4.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and want to reach the point marked at coordinates (0.222, 0.825). How far do you need to walk in feet?" }, { "from": "gpt", "value": "The distance between the point marked at coordinates (0.222, 0.825) and the camera is 4.11 feet, so you need to walk 4.11 feet to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/457947f1846b871e.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between point (0.786, 0.692) and camera?" }, { "from": "gpt", "value": "The distance of point (0.786, 0.692) from camera is 1.32 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e4b820f7076b84e.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the black uniform at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.826, 0.447)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4548ef145b8b1575.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the white painted parking line at lower center and want to walk to the white brick building at center. How far do you have to walk?" }, { "from": "gpt", "value": "The white brick building at center is 48.47 feet away from the white painted parking line at lower center, so you have to walk 48.47 feet to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d2b08920a0aabc5e.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.324, 0.006) and camera?" }, { "from": "gpt", "value": "Point (0.324, 0.006) is 2.00 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea14afe1da3ffd2d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if transparent plastic violin at right is positioned above matte silver trumpet at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/33f1577c71adcff2.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.098, 0.628) or point (0.619, 0.303)?" }, { "from": "gpt", "value": "Point (0.619, 0.303)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c3266317a9a8c06.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the white cotton shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.931, 0.686)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c96d5d365e029c9f.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, green fabric jacket at center or black scarf at center?" }, { "from": "gpt", "value": "green fabric jacket at center is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a9c154fda31dce50.jpg", "conversations": [ { "from": "human", "value": "\nIs black plastic computer at left to the left of white matte monitor at center from the viewer's perspective?" }, { "from": "gpt", "value": "No, black plastic computer at left is not to the left of white matte monitor at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/50e3c2c9a1d1ef00.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of green matte shirt at center in the image." }, { "from": "gpt", "value": "[(0.727, 0.583)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dcfe483ecfda9ee8.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of shiny blue helmet at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.597, 0.577)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3df0095168531103.jpg", "conversations": [ { "from": "human", "value": "\nHow far is green textured tree at right from camera?" }, { "from": "gpt", "value": "green textured tree at right is 17.51 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf2f27d4744484a3.jpg", "conversations": [ { "from": "human", "value": "\nWhere is plaid fabric shirt at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.525, 0.559)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c5eee2139aab16af.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the black asphalt highway at lower center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.498, 0.914)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8efc406e7f468800.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden table at center positioned behind velvet black jacket at upper right?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/59bbfa62d814d3f8.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to white fluffy cloud at upper center? Please provide its 2D coordinates.Where can I find white fluffy cloud at upper center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.584, 0.359)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d2543e1d12d670f1.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.296, 0.775) come in front of point (0.573, 0.758)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02a67618c5aeb75d.jpg", "conversations": [ { "from": "human", "value": "\nIs matte blue zip-up jacket at left shorter than gray/woolly beard at right?" }, { "from": "gpt", "value": "No, matte blue zip-up jacket at left is not shorter than gray/woolly beard at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5108716f567e1f9e.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown wooden bench at center have a greater width compared to knitted wool scarf at center?" }, { "from": "gpt", "value": "Yes, brown wooden bench at center is wider than knitted wool scarf at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4ddf491c5f25d300.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if shiny black bicycle at center is taller than matte black boat at left?" }, { "from": "gpt", "value": "Indeed, shiny black bicycle at center has a greater height compared to matte black boat at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b60854841843af3.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person with a cart that is 2 meters wide. You need to move through the space between the transparent glass door at center and the white plastic parking sign at upper left. Can your cart fit through the space between them?" }, { "from": "gpt", "value": "The transparent glass door at center and the white plastic parking sign at upper left are 2.50 meters apart from each other. Since your cart is 2 meters wide, it can fit through the space between them as the distance is greater than the cart width." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/521b3d6b1be1a94f.jpg", "conversations": [ { "from": "human", "value": "\nBetween matte gray t-shirt at center and pink matte shirt at center, which one has more height?" }, { "from": "gpt", "value": "pink matte shirt at center is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c83f9d08c10ae851.jpg", "conversations": [ { "from": "human", "value": "\nYou are an event planner arranging the layout for a presentation. You need to ensure that the matte black screen at left and the white marble statue at center are positioned correctly according to the venue guidelines. Based on the scene, which object is placed lower in the room?" }, { "from": "gpt", "value": "The matte black screen at left is placed lower in the room than the white marble statue at center because the matte black screen at left is below white marble statue at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/808c25137f6f7846.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.311, 0.830) positioned in front of point (0.350, 0.666)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c517937f33f7bbf0.jpg", "conversations": [ { "from": "human", "value": "\nHow far is point (0.823, 0.395) from the camera?" }, { "from": "gpt", "value": "Point (0.823, 0.395) is 3.36 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b3bcc47df31a82b6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white fluffy snow at center is positioned to the left of brown leather jacket at center?" }, { "from": "gpt", "value": "No, white fluffy snow at center is not to the left of brown leather jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ad9598b583cc7915.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between sandy beach at center and camera?" }, { "from": "gpt", "value": "sandy beach at center is 17.81 feet away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b386a810cc763a6.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the travel bags and want to place a small item on the point closer to you between point (0.574, 0.277) and point (0.266, 0.425). Which point should you choose?" }, { "from": "gpt", "value": "Point (0.574, 0.277) is in front of point (0.266, 0.425), so you should choose point (0.574, 0.277) as it is closer to you." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/001871616f71eff1.jpg", "conversations": [ { "from": "human", "value": "\nWhat is located at the coordinates point (0.317, 0.597) in the image?" }, { "from": "gpt", "value": "The blue dotted shirt at center is located at point (0.317, 0.597)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/244be93a798ba9d2.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.930, 0.848) less distant than point (0.606, 0.097)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e06f975fc92f97d9.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.395, 0.938) from camera?" }, { "from": "gpt", "value": "11.75 feet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff21d052cc89af95.jpg", "conversations": [ { "from": "human", "value": "\nHow close is matte black robot at center from camera?" }, { "from": "gpt", "value": "They are 1.31 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44e8489215f4ed80.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the matte blue book at upper left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.209, 0.219)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/adf167d28b602b54.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.063, 0.814) and point (0.477, 0.717), which one is positioned behind?" }, { "from": "gpt", "value": "Positioned behind is point (0.477, 0.717)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fdbb6d2ef098dedb.jpg", "conversations": [ { "from": "human", "value": "\nIs white cotton pillow at center closer to the viewer compared to crocheted white pillow at right?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5e7ae93f713025f.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between point (0.245, 0.334) and camera." }, { "from": "gpt", "value": "A distance of 6.66 feet exists between point (0.245, 0.334) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c44f551bea69d211.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.152, 0.430)?" }, { "from": "gpt", "value": "dark brown textured tree trunk at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f99170d94f6c23db.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the smooth brown water at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.742, 0.939)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/51568f5f8a94f2c5.jpg", "conversations": [ { "from": "human", "value": "\nHow close is green matte water at center from camera?" }, { "from": "gpt", "value": "3.98 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d8b28712b9d1af0b.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at upper center positioned before blue matte mug at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d37e98425a90cff.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the polka dot glass at lower left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.252, 0.731)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/93b6b7e96f5109c4.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white paper poster at upper center is positioned below dark gray hoodie at left?" }, { "from": "gpt", "value": "Correct, white paper poster at upper center is located below dark gray hoodie at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d168f6181fc00ee6.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte/deck bus at center positioned in front of white plastic license plate at center?" }, { "from": "gpt", "value": "Yes, it is in front of white plastic license plate at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/916834929ebd0aa1.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of the EUROA HOTEL and want to take a photo of the point at coordinates point (0.117, 0.803). If your camera has a maximum focus range of 35 meters, will you be able to capture it clearly?" }, { "from": "gpt", "value": "The point (0.117, 0.803) is 37.08 meters from the camera, which exceeds the camera maximum focus range of 35 meters. Therefore, the camera cannot capture it clearly." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/41f35d17dd7348e0.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.784, 0.664)?" }, { "from": "gpt", "value": "clear plastic vial at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73fefe262897ff8f.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up for a family photo. You need to ensure the white cotton onesie at center and the white matte helmet at upper right are both visible in the frame. Based on their positions, which object is closer to the camera?" }, { "from": "gpt", "value": "The white cotton onesie at center is positioned under the white matte helmet at upper right, meaning it is closer to the camera than the helmet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d4db3252e03ffbf.jpg", "conversations": [ { "from": "human", "value": "\nYou are a visitor in the conference hall and see the matte orange shirt at left and the matte black backpack at left. Which object is closer to your right side?" }, { "from": "gpt", "value": "The matte orange shirt at left is closer to your right side since it is positioned to the right of the matte black backpack at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bac5eb1f68be2a84.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, blue fabric table at center or brown cotton shirt at center, stands taller?" }, { "from": "gpt", "value": "Standing taller between the two is brown cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/899db8821bc791ba.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue floral dress at center come in front of matte black suit at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7c0dc22c1f515ce9.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, gray matte t-shirt at center or green matte t-shirt at left?" }, { "from": "gpt", "value": "gray matte t-shirt at center is above." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00de75534bb096cd.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the left, matte gray shirt at center or matte black face paint at upper left?" }, { "from": "gpt", "value": "matte black face paint at upper left is more to the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/75f7cf498587f79c.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.230, 0.817) behind point (0.814, 0.478)?" }, { "from": "gpt", "value": "Yes, point (0.230, 0.817) is behind point (0.814, 0.478)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c3ceaa8c78e2dca.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the room and want to place a small potted plant between the black polished stone pillar at right and the white cotton dress at center. Based on their positions, where should you place the plant?" }, { "from": "gpt", "value": "The black polished stone pillar at right is positioned on the right side of white cotton dress at center, so you should place the plant between them to the right of the white cotton dress at center and to the left of the black polished stone pillar at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01f2bdc7fd265e21.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of black printed fabric dress at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.805, 0.822)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1912dc129a993346.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.735, 0.422) or (0.495, 0.719)?" }, { "from": "gpt", "value": "Positioned in front is point (0.495, 0.719)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c2418f003f9168d0.jpg", "conversations": [ { "from": "human", "value": "\nYou are an artist trying to paint the winter scene. You notice the white fluffy snow at center and the denim jeans at left. Which object should you paint first if you want to follow the rule of painting larger objects before smaller ones?" }, { "from": "gpt", "value": "You should paint the white fluffy snow at center first because it is larger than the denim jeans at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec0c1326fe68f8d6.jpg", "conversations": [ { "from": "human", "value": "\nBetween white glossy stairs at center and wooden stairs at center, which one is positioned higher?" }, { "from": "gpt", "value": "wooden stairs at center is above." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/22dfbb344c75cf8e.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of dark brown leather jacket at lower left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.156, 0.616)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/56bff34fa9a23827.jpg", "conversations": [ { "from": "human", "value": "\nDoes speckled feathered rooster at center have a greater height compared to red fleece jacket at center?" }, { "from": "gpt", "value": "No, speckled feathered rooster at center is not taller than red fleece jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95efe216c017efa0.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the striped fabric sun visor at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.324, 0.700)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe4e7bbf6497d2f9.jpg", "conversations": [ { "from": "human", "value": "\nLocate the blue cotton shirt at right in the image." }, { "from": "gpt", "value": "[(0.787, 0.619)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e31ab5315f06dbb1.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of rasta-patterned dress at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.123, 0.348)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb035e6415f11632.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between brown sandy beach at lower center and white glossy boat at center." }, { "from": "gpt", "value": "They are 60.63 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d7354415f1a902c.jpg", "conversations": [ { "from": "human", "value": "\nHow far apart are brown tile roof hut at center and blue water at center?" }, { "from": "gpt", "value": "brown tile roof hut at center is 62.20 feet away from blue water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0b4e24dbc974901.jpg", "conversations": [ { "from": "human", "value": "\nWhat is at (0.765, 0.453)?" }, { "from": "gpt", "value": "matte red armchair at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3af7fe7a20f21701.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.460, 0.567) come behind point (0.120, 0.511)?" }, { "from": "gpt", "value": "No, (0.460, 0.567) is in front of (0.120, 0.511)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/63465af3c7061937.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if camouflage-patterned shorts at right is positioned above orange cotton shirt at upper center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9bf36fc35f75f1ab.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery driver who needs to park your delivery van, which is 3.5 meters long, between the gray concrete curb at lower left and another curb. Can you fit your van there?" }, { "from": "gpt", "value": "The distance between the gray concrete curb at lower left and the other curb is 3.37 meters, which is shorter than your van length of 3.5 meters. Therefore, your van cannot fit in that space." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4547d84b86544907.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of black satin dress at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.790, 0.841)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/13da3d9071b51d0b.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of white mist at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.506, 0.227)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1aa1d788c77d15cf.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between matte skin hand at lower left and camera?" }, { "from": "gpt", "value": "30.22 inches" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ee403d68bfb9f433.jpg", "conversations": [ { "from": "human", "value": "\nYou are an artist trying to capture the perfect shot of the blue neon sign at center and the bright white light at center. Based on their positions, which one should you focus on first if you want to frame them both from top to bottom?" }, { "from": "gpt", "value": "The blue neon sign at center is located above the bright white light at center, so you should focus on the blue neon sign at center first to frame them from top to bottom." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c24fecc9eb90b255.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between black silk suit at center and pinstriped suit at center." }, { "from": "gpt", "value": "The distance of black silk suit at center from pinstriped suit at center is 17.59 inches." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9bbe75b215aa3920.jpg", "conversations": [ { "from": "human", "value": "\nBetween shiny black sedan at center and metallic blue car at center, which one is positioned lower?" }, { "from": "gpt", "value": "metallic blue car at center is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6393c921a107d32a.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.566, 0.892) or (0.445, 0.850)?" }, { "from": "gpt", "value": "The point (0.566, 0.892) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1895afedf31d474e.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the green leafy tree at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.879, 0.416)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f06366908f508f61.jpg", "conversations": [ { "from": "human", "value": "\nYou are a chef preparing a dessert and need to place the red matte soy whip can at center and the metallic gold canister at center on a shelf that is 6 inches wide. Can both items fit side by side on the shelf without overlapping?" }, { "from": "gpt", "value": "The red matte soy whip can at center is 4.53 inches from the metallic gold canister at center. Since the total distance between them is less than the 6 inch shelf width, both items can fit side by side on the shelf without overlapping." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4b8ae53adcf6d756.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is rusty metal mech at center from camera?" }, { "from": "gpt", "value": "rusty metal mech at center is 92.74 centimeters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e398690f41d71e0e.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark brown hair at upper center have a smaller size compared to matte black laptop at upper center?" }, { "from": "gpt", "value": "Yes, dark brown hair at upper center is smaller than matte black laptop at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f9ac77c0aba07f5.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the origin point of the image coordinate system. A white jersey at center is located at point (0.282, 0.448). If you move 0.1 units to the right along the x axis, will you be closer to or farther from the white jersey at center?" }, { "from": "gpt", "value": "Moving 0.1 units to the right along the x axis from the origin would take you to point 0.1, 0.0. The white jersey at center is at point (0.282, 0.448). The distance between the new position and the white jersey would be sqrt? 0.348 squared plus 0.282 squared, which is approximately sqrt? 0.121 plus 0.0795 equals sqrt? 0.1995, which is about 0.447 units. The original distance from the origin to the white jersey is sqrt? 0.448 squared plus 0.282 squared equals sqrt? 0.1995 plus 0.0795 equals sqrt? 0.279, which?" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ef199cc1e723c80.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.622, 0.916) and point (0.446, 0.184), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.446, 0.184) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c47b4b8cc576b55f.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if satin black graduation gown at center is positioned below satin black gown at lower left?" }, { "from": "gpt", "value": "No, satin black graduation gown at center is not below satin black gown at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/45458262a50efea8.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of green wool suit at center?" }, { "from": "gpt", "value": "A distance of 3.43 feet exists between green wool suit at center and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dadcad2fcfbc9552.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of transparent water at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.497, 0.733)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/675f11bb455bb59e.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the blue fabric shirt at left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.079, 0.647)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5eca4017abda0516.jpg", "conversations": [ { "from": "human", "value": "\nWhere is plaid shirt at left located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.302, 0.362)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9dd940c2ab0147f6.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the event and want to take a photo of the black matte shirt at center. How far should you position yourself from the subject to capture it clearly?" }, { "from": "gpt", "value": "The black matte shirt at center is 1.32 meters away from the camera, so you should position yourself approximately 1.32 meters away to capture it clearly." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/35073170f34c7d0b.jpg", "conversations": [ { "from": "human", "value": "\nDoes rusty metal train track at lower left have a smaller size compared to black fur dog at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce2f22fa529f068b.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.794, 0.611) or (0.040, 0.617)?" }, { "from": "gpt", "value": "Positioned in front is point (0.040, 0.617)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0a1d3a15d676b33.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up for a group photo. You need to position yourself so that the mahogany wood table at lower left and the black matte blazer at center are both visible in your frame. Based on their positions, which object is closer to the camera?" }, { "from": "gpt", "value": "The black matte blazer at center is closer to the camera because the mahogany wood table at lower left is positioned under it, meaning the blazer is above and nearer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1096c7b0655086c8.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between blue striped fabric dress at center and light gray cotton pencil skirt at center." }, { "from": "gpt", "value": "They are 6.71 inches apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc0d40f16c389530.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the red matte cable car at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.555, 0.692)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/510d192fc0689ff6.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the black pants at left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.123, 0.189)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bdf71d7fc9405319.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the outdoor scene described. There is a point labeled as point (0.452, 0.972). If you want to reach this point, how far do you need to walk?" }, { "from": "gpt", "value": "The point (0.452, 0.972) is 6.28 meters away from the viewer, so you need to walk 6.28 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/215d5c4c44f5394b.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from point (0.188, 0.216) to camera." }, { "from": "gpt", "value": "They are 1.71 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02ba60b431dd1cac.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.442, 0.652) closer to camera compared to point (0.971, 0.619)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/684bfd81cabd6352.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the scene without disturbing them. You need to place a small camera on either the black matte shirt at upper right or the soft white blanket at lower left. Which surface is closer to you so you can reach it easily?" }, { "from": "gpt", "value": "The black matte shirt at upper right is in front of the soft white blanket at lower left, so it is closer to you and easier to reach." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/439b26a06a80ad46.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a candid shot of the person with blonde hair at lower right and white checkered shorts at right. Since you want to ensure both subjects are in focus, which one should you focus on first to ensure proper depth of field?" }, { "from": "gpt", "value": "You should focus on the blonde hair at lower right first because it is closer to the camera than the white checkered shorts at right, ensuring proper depth of field for both subjects." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb23f8192c59ca8e.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the green mossy roof at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.603, 0.123)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/84e2febb4e779a55.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the scene of the playground. You notice the dark blue tank top at upper right and the tan skin girl at lower right. Which object should you focus on if you want to capture the larger subject in your photo?" }, { "from": "gpt", "value": "The tan skin girl at lower right is larger than the dark blue tank top at upper right, so you should focus on the tan skin girl at lower right to capture the larger subject in your photo." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06b778083c37003c.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the edge of a snow covered balcony looking at the white matte park bench at center. How far is the bench from you?" }, { "from": "gpt", "value": "The white matte park bench at center is 7.10 feet away from you." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8ea07e0a99e06467.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of brown fur coat at center in the image." }, { "from": "gpt", "value": "[(0.485, 0.762)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8f70572e8b56a480.jpg", "conversations": [ { "from": "human", "value": "\nWhat is at (0.713, 0.512)?" }, { "from": "gpt", "value": "black suit at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a34e67af8334e909.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of dark blue uniform at left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.183, 0.561)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a546714c705be06.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person trying to park your van in the parking lot. You see the dark gray asphalt at lower right and the blue plastic license plate at lower right. Which one is closer to the ground?" }, { "from": "gpt", "value": "The dark gray asphalt at lower right is positioned under the blue plastic license plate at lower right, so the asphalt is closer to the ground." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d04f5f9598dc0b87.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer adjusting your camera settings to focus on the subject in the image. You notice the smooth skin face at center and the blue glossy eye at center. Which object should you focus on first if you want to ensure the subject looks sharp, and why?" }, { "from": "gpt", "value": "You should focus on the blue glossy eye at center first because it is closer to the camera than the smooth skin face at center. Focusing on the closer object ensures the subject appears sharp." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff675db43599a2de.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the tram station and want to board the matte orange train at left. According to the coordinates provided, where exactly should you go to board it?" }, { "from": "gpt", "value": "The matte orange train at left is located at coordinates point (0.168, 0.658), so you should go to that position to board it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/66742893b87e2be9.jpg", "conversations": [ { "from": "human", "value": "\nWhere is dark blue shirt at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.430, 0.639)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49eb7eb784d1e91f.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of black matte shirt at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.442, 0.683)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/12c91ce223d8f7c6.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of purple plush monkey at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.278, 0.525)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e34f5df13ec998f3.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of multicolored fabric at center more distant than that of green matte blazer at left?" }, { "from": "gpt", "value": "No, it is in front of green matte blazer at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d126c0abb563c3d1.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of blue printed scarf at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.706, 0.667)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f7f2bdb030f637c.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the purple fabric shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.455, 0.644)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/56c59ab59c438026.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.131, 0.706) closer to camera compared to point (0.107, 0.762)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b56092c89ed919d.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person who needs to deliver a package to the address shown on the billboard. You see a woman with camouflage pants at center. Where should you approach her to ask for directions?" }, { "from": "gpt", "value": "You should approach the woman with camouflage pants at center at point (0.835, 0.580) to ask for directions." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd1d93f59d824f7d.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at center positioned behind green grass at lower center?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c712932e39a93dbd.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.363, 0.786) closer to camera compared to point (0.675, 0.784)?" }, { "from": "gpt", "value": "No, it is behind (0.675, 0.784)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/721edfc43c3d503d.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.543, 0.325) or point (0.676, 0.373)?" }, { "from": "gpt", "value": "Positioned behind is point (0.676, 0.373)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00a45acbc2ff6a1c.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the light skin strapless dress at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.754, 0.742)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0bfb0710cf32395.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between light blue cotton shirt at left and camera?" }, { "from": "gpt", "value": "light blue cotton shirt at left is 7.66 feet away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/48f1f4b205732ca2.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, dark blue sweatshirt at right or green leafy tree at center?" }, { "from": "gpt", "value": "From the viewer's perspective, dark blue sweatshirt at right appears more on the right side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ece461fca8c9fb6.jpg", "conversations": [ { "from": "human", "value": "\nHow close is cobblestone pavement at right from camera?" }, { "from": "gpt", "value": "The distance of cobblestone pavement at right from camera is 12.40 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a98336746cf55ec6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black glossy monitor at center is positioned to the right of matte silver lamp at left?" }, { "from": "gpt", "value": "Yes, black glossy monitor at center is to the right of matte silver lamp at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f2c6566cbce6ece8.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.925, 0.083) or point (0.649, 0.061)?" }, { "from": "gpt", "value": "Point (0.649, 0.061) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c73a9eaf314ae445.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the blue fabric table at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.717, 0.558)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a31a55cfdcff779e.jpg", "conversations": [ { "from": "human", "value": "\nBetween velvet maroon dress at center and gold mesh crown at upper center, which one has more height?" }, { "from": "gpt", "value": "velvet maroon dress at center is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/528f71637afa14d4.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if shiny plastic kayaks at center is positioned below transparent plastic water at lower center?" }, { "from": "gpt", "value": "Actually, shiny plastic kayaks at center is above transparent plastic water at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a32bda17bf47222e.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.187, 0.873)?" }, { "from": "gpt", "value": "dark gray sweater at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cfb8ae93693633bb.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is matte black backpack at left from camera?" }, { "from": "gpt", "value": "matte black backpack at left is 5.32 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/470d87f6d26887f0.jpg", "conversations": [ { "from": "human", "value": "\nYou are an artist planning to sketch the scene from the park. You notice the bronze statue at center and the blue fabric jacket at center. Which object should you draw first if you want to capture the most prominent elements first?" }, { "from": "gpt", "value": "The bronze statue at center has a larger size compared to the blue fabric jacket at center, so you should draw the bronze statue at center first to capture the most prominent elements first." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/79362d2be7ce0258.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of black matte dress at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.350, 0.572)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/483d31276c9630ec.jpg", "conversations": [ { "from": "human", "value": "\nYou are an inspector in this industrial facility and need to check the machinery. You notice two workers wearing the matte gray shirt at center and the black cotton shirt at center. Which worker is standing closer to the ground?" }, { "from": "gpt", "value": "The matte gray shirt at center is located below the black cotton shirt at center, so the worker wearing the matte gray shirt at center is standing closer to the ground." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36f8b8b9e7e06f54.jpg", "conversations": [ { "from": "human", "value": "\nDescribe the object at (0.058, 0.647)." }, { "from": "gpt", "value": "green leafy tree at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e08c9ad18006abeb.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.796, 0.653) and point (0.681, 0.603), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.681, 0.603) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a95e57a412726a4.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green lawn at center is wider than green leafy tree at center?" }, { "from": "gpt", "value": "Yes, green lawn at center is wider than green leafy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e9fa725bb0808009.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of gray fabric shirt at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.404, 0.728)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/808a54ece13193d1.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of brown cardboard box at center-right? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.825, 0.605)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d540279cb216d14b.jpg", "conversations": [ { "from": "human", "value": "\nBetween green leafy branch at upper right and green matte tree at lower left, which one has less height?" }, { "from": "gpt", "value": "With less height is green matte tree at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d221537e2ca0d0fb.jpg", "conversations": [ { "from": "human", "value": "\nDescribe the object at (0.538, 0.534)." }, { "from": "gpt", "value": "blue water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f080f7f69770b89.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between black matte speaker at left and matte black microphone at center." }, { "from": "gpt", "value": "The distance of black matte speaker at left from matte black microphone at center is 38.00 inches." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/828a6c1a5cc5010e.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.770, 0.892) lie in front of point (0.942, 0.723)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bb74d94688575aca.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the green leafy tree at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.925, 0.892)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c9c12bf8efa6edeb.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.364, 0.730) and camera?" }, { "from": "gpt", "value": "Point (0.364, 0.730) is 9.41 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d646161a5d61a26.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.939, 0.825) or point (0.636, 0.472)?" }, { "from": "gpt", "value": "Point (0.939, 0.825) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb6e35084eaa8f65.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of striped fabric dress at upper left. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.214, 0.389)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0b1e8950861dab6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white glossy boat at center is positioned above transparent water at lower left?" }, { "from": "gpt", "value": "Yes, white glossy boat at center is above transparent water at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8053ba4b1dbff6d7.jpg", "conversations": [ { "from": "human", "value": "\nIs light blue floral blouse at center below floral fabric blouse at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f4f58756bf14e0c6.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black monitor at lower left have a greater height compared to satin silver laptop at center?" }, { "from": "gpt", "value": "Correct, matte black monitor at lower left is much taller as satin silver laptop at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6feca827b8b4709b.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between point (0.185, 0.537) and camera?" }, { "from": "gpt", "value": "Point (0.185, 0.537) and camera are 1.20 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe80700f120c8050.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.517, 0.622)?" }, { "from": "gpt", "value": "light gray cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/154d473eff6e6c96.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black jacket at left appear on the right side of matte gray jacket at left?" }, { "from": "gpt", "value": "Indeed, matte black jacket at left is positioned on the right side of matte gray jacket at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a1f823987d425d7e.jpg", "conversations": [ { "from": "human", "value": "\nPoint to green painted wood park bench at lower left.Point to the green painted wood park bench at lower left in the image." }, { "from": "gpt", "value": "[(0.253, 0.916)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e985e3e086243ff3.jpg", "conversations": [ { "from": "human", "value": "\nWhere is the white plastic laptop at center located in the image?" }, { "from": "gpt", "value": "The white plastic laptop at center is located at point coordinates of (0.294, 0.517)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9aa562693da5dd8f.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.725, 0.856) come in front of point (0.127, 0.820)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1286b14913603f01.jpg", "conversations": [ { "from": "human", "value": "\nYou are a nurse in the field hospital and need to quickly identify which staff member is closer to the patient for immediate assistance. Based on the uniforms, which staff member is positioned closer to the patient between the light beige uniform at right and the camouflage uniform at right?" }, { "from": "gpt", "value": "The light beige uniform at right has a smaller size compared to camouflage uniform at right, so the light beige uniform at right is positioned closer to the patient." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4fd8d0f1a705c90a.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of matte floral dress at center in the image." }, { "from": "gpt", "value": "[(0.249, 0.572)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce119ae072338b84.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the green matte jacket at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.335, 0.545)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9a41fb6aa8aad43a.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, silvery reflective water at center or golden stone tower at center, stands taller?" }, { "from": "gpt", "value": "golden stone tower at center is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8eb94f4ba05d7a05.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked as point (0.905, 0.236). What object is located exactly at this point?" }, { "from": "gpt", "value": "The point (0.905, 0.236) is where the green leafy tree at right is located." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/91422828051de7c8.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing in the middle of the group. You want to take a photo that includes both the blue checkered shirt at left and the metallic silver car at right. Can you position yourself so that both are in the frame without moving any objects? Explain your reasoning." }, { "from": "gpt", "value": "The blue checkered shirt at left and the metallic silver car at right are 4.33 meters apart. Since the photographer is in the middle of the group, they can likely position themselves to include both in the frame as 4.33 meters is a manageable distance for a standard camera lens to capture both subjects without needing to move objects." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b10f9025920a42fc.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.921, 0.795) and point (0.535, 0.956), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.535, 0.956) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/80963842529a553e.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a matte blue shirt at center. Pinpoint a point to the matte blue shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.213, 0.578)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/19ee366a9313fb35.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.253, 0.564) from camera?" }, { "from": "gpt", "value": "Point (0.253, 0.564) is 1.91 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/98de11e5c5704941.jpg", "conversations": [ { "from": "human", "value": "\nBetween yellow matte shirt at center and light blue denim shorts at center, which one is positioned higher?" }, { "from": "gpt", "value": "light blue denim shorts at center is higher up." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f85b78b0049eefe5.jpg", "conversations": [ { "from": "human", "value": "\nDoes yellow metal railing at lower center lie behind teal glass railing at upper center?" }, { "from": "gpt", "value": "Yes, yellow metal railing at lower center is behind teal glass railing at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/991c4af57d1afdd4.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the green grass at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.666, 0.923)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05a8ec1191fbd03f.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, yellow fabric dress at center or yellow chiffon dress at center, stands shorter?" }, { "from": "gpt", "value": "yellow chiffon dress at center is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a76cc392d28e7877.jpg", "conversations": [ { "from": "human", "value": "\nYou are a bird flying over the urban landscape. You want to land on a higher spot between the green leafy tree at center and the orange autumn leaves at upper center. Which one should you choose?" }, { "from": "gpt", "value": "The green leafy tree at center has a greater height compared to the orange autumn leaves at upper center, so you should choose the green leafy tree at center to land on." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6918830abd9076aa.jpg", "conversations": [ { "from": "human", "value": "\nYou are a fashion designer observing the group and want to create a matching accessory for both the striped wool sweater at left and the yellow striped shirt at center. Considering their sizes, which one would require a larger accessory?" }, { "from": "gpt", "value": "The striped wool sweater at left requires a larger accessory because it has a larger size compared to the yellow striped shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1be9ef2aefd938b4.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to dark purple shirt at left? Please provide its 2D coordinates.Where can I find dark purple shirt at left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.094, 0.717)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1dd37e4666d7f1fb.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, pink matte shirt at lower right or green matte shirt at center, stands taller?" }, { "from": "gpt", "value": "pink matte shirt at lower right is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1fce5772f062ca81.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person who needs to place a large package on the platform. The package is the size of the smooth concrete platform at center. Can you place the matte gray bag at left on top of the package without it falling off?" }, { "from": "gpt", "value": "The smooth concrete platform at center is larger in size than the matte gray bag at left, so placing the matte gray bag at left on top of the package would be stable since the package is bigger and can support it properly." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c619d53a6dfd59a1.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.870, 0.969) or (0.702, 0.713)?" }, { "from": "gpt", "value": "Point (0.870, 0.969)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/792d977674dfc957.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the wooden deck and want to place a treat at the point with coordinates (0.274, 0.648). Which dog should you target to ensure the treat lands on its fur?" }, { "from": "gpt", "value": "The point with coordinates (0.274, 0.648) is on the brown and black fur dog at center, so you should target that dog to ensure the treat lands on its fur." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73e9615d1b13ee1d.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.273, 0.648)?" }, { "from": "gpt", "value": "plaid flannel shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c5aee4fe66571574.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of rugged stone mountain at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.482, 0.652)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1b2ee7b5138fd39.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of stone/stained wood stairs at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.462, 0.802)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8def81279ecbc45c.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of floral dress at lower left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.164, 0.719)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0b5625cce4833f2.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the matte red tank top at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.467, 0.705)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d1768979c1b17b7.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.843, 0.527) and point (0.572, 0.787), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.843, 0.527) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fd964f4203e4375c.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of wooden hut at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.915, 0.378)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6871bc7b2333b233.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the smooth white baby at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.558, 0.720)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/11c70ae2252e3c59.jpg", "conversations": [ { "from": "human", "value": "\nLocate all black leather jacket at center in the image." }, { "from": "gpt", "value": "[(0.629, 0.473)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/31cd1efcf277398a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at upper center is taller than smooth pink skin at lower center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/65d6dee8761efb80.jpg", "conversations": [ { "from": "human", "value": "\nIs brown hair at left above multicolored beads at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7f9c1d3ed9c4c5cd.jpg", "conversations": [ { "from": "human", "value": "\nBetween green grassy at center and brown wooden fence at lower left, which one has more height?" }, { "from": "gpt", "value": "brown wooden fence at lower left is taller." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e2b19c1d8e790b01.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of silver metallic motorcycle at lower left. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.227, 0.883)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95403448516aeb48.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the orange fabric jacket at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.493, 0.730)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5eab51ca6b05ecba.jpg", "conversations": [ { "from": "human", "value": "\nLocate all black reflective sunglasses at center in the image." }, { "from": "gpt", "value": "[(0.583, 0.534)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0653144fa5240926.jpg", "conversations": [ { "from": "human", "value": "\nYou are driving a car and see the shiny black car at lower right and the red matte traffic light at center. Which object is closer to you?" }, { "from": "gpt", "value": "The shiny black car at lower right is closer to you than the red matte traffic light at center because the traffic light is positioned behind the car." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c2ac622248b264ad.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of brown leather couch at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.448, 0.470)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7568b2eef61877b.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the room and want to place a small decorative item exactly halfway between point (0.512, 0.767) and point (0.754, 0.658). Given that the camera is positioned at the entrance, will the decorative item be closer to the camera or further away from it compared to the two points?" }, { "from": "gpt", "value": "The decorative item placed halfway between point (0.512, 0.767) and point (0.754, 0.658) will be closer to the camera than point (0.754, 0.658) but farther than point (0.512, 0.767). Since the average distance would be between the two, it won???t be closer to the camera than both points." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02e1ebce2c15b57e.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the scene and want to hand a small item to the person wearing the gray cotton shirt at right. How far do you need to move forward to reach them?" }, { "from": "gpt", "value": "The gray cotton shirt at right and viewer are 6.47 feet apart, so you need to move forward approximately 6.47 feet to reach them." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f02df85a4c66e467.jpg", "conversations": [ { "from": "human", "value": "\nYou are taking a photo of two people in a park. You notice the green cotton shirt at center and sunglasses at center. Which object is larger in the photo?" }, { "from": "gpt", "value": "The green cotton shirt at center is bigger than sunglasses at center in the photo." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a14fa3af5dcaebe.jpg", "conversations": [ { "from": "human", "value": "\nHow close is matte blue shirt at upper center from dark glass bottle at center?" }, { "from": "gpt", "value": "matte blue shirt at upper center and dark glass bottle at center are 4.37 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/480f85fccf0ca6c1.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of green glossy tile at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.512, 0.717)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08eea0b89215e90a.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a concrete at center. Pinpoint a point to the concrete at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.642, 0.850)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37064dd08fe33c9d.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.278, 0.900) and point (0.725, 0.978), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.278, 0.900) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe88795a83600318.jpg", "conversations": [ { "from": "human", "value": "\nDoes white paper at upper left have a larger size compared to white matte vest at center?" }, { "from": "gpt", "value": "Yes, white paper at upper left is bigger than white matte vest at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2495a5c49f48c64.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between point (0.580, 0.364) and camera?" }, { "from": "gpt", "value": "The distance of point (0.580, 0.364) from camera is 23.60 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/524f504dcbaf511b.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the modern building and want to find the clear glass window at lower left. According to the scene description, where should you look relative to the exit sign on the wall?" }, { "from": "gpt", "value": "The clear glass window at lower left is located at point (0.108, 0.833), which is to the left side of the exit sign mounted on the wall." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8457b16691b8b1c8.jpg", "conversations": [ { "from": "human", "value": "\nYou are designing a new tablecloth for the table in the image. The table has a matte peach tank top at center and a silver metallic laptop at left. To ensure the tablecloth covers both items adequately, which item requires a larger portion of the tablecloth based on their widths?" }, { "from": "gpt", "value": "The matte peach tank top at center requires a larger portion of the tablecloth because its width is greater than the silver metallic laptop at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/caac3d6bb7290c7d.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position looking at the vast landscape. There is a point marked at coordinates (0.404, 0.231) in the image. How far is this point from your current position?" }, { "from": "gpt", "value": "The point at coordinates (0.404, 0.231) is 230.87 meters away from your current position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/65fd2245a26cd415.jpg", "conversations": [ { "from": "human", "value": "\nYou are a flight attendant who needs to move from the blue plaid shirt at center to the black fleece at right during a safety check. How much space do you need to navigate between them?" }, { "from": "gpt", "value": "The distance between the blue plaid shirt at center and the black fleece at right is 33.53 inches, so the flight attendant needs to navigate a space of approximately 33.53 inches to move between them." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/10a3f736167ee926.jpg", "conversations": [ { "from": "human", "value": "\nYou are a customer in the store and want to pick up the red fabric at upper right. Can you reach it without moving the black rubber snowshoes at center?" }, { "from": "gpt", "value": "The black rubber snowshoes at center is located below the red fabric at upper right, so you can reach the red fabric at upper right without moving the snowshoes since it is above them." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7e2808bfebfe383.jpg", "conversations": [ { "from": "human", "value": "\nWhat is at (0.495, 0.309)?" }, { "from": "gpt", "value": "brown corrugated metal roof at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fbd3570799135986.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.409, 0.294)?" }, { "from": "gpt", "value": "black fabric jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/326e5562da2b55fc.jpg", "conversations": [ { "from": "human", "value": "\nIs plaid shirt at left below brown felt cowboy hat at left?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d547acfb7a41f62.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the green textured hillside at upper center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.517, 0.333)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/87c71590204c80ca.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up for a group photo. You need to position yourself so that both the shiny black suit at center and the blue satin skirt at center are in focus. Which object should you focus on first to ensure both are sharp?" }, { "from": "gpt", "value": "You should focus on the shiny black suit at center first since it is closer to the viewer than the blue satin skirt at center. By focusing on the closer object, the depth of field will extend to include the farther object, ensuring both are in focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd822ef358e016bf.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.402, 0.928) and camera." }, { "from": "gpt", "value": "The distance of point (0.402, 0.928) from camera is 9.92 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/519886becf2aa9ae.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark blue water at center have a greater height compared to blue matte boat at lower right?" }, { "from": "gpt", "value": "Indeed, dark blue water at center has a greater height compared to blue matte boat at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7c5b7faf605828d0.jpg", "conversations": [ { "from": "human", "value": "\nYou are sitting in the front row of the lecture hall and notice the white matte projector screen at center and the brown hair at lower left. Which object is taller?" }, { "from": "gpt", "value": "The white matte projector screen at center is taller than the brown hair at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/226b9598f842ee8a.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of white cardboard boxes at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.692, 0.792)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e098aff0d0a6fbed.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the reddish-brown leaves at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.832, 0.216)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d364fa38078e141f.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of black leather jacket at center in the image." }, { "from": "gpt", "value": "[(0.386, 0.416)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/309940b9da248585.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between white plastic booth at center and camera." }, { "from": "gpt", "value": "36.55 feet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07ccc3cb986cc9f3.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the event and want to ensure both the black matte jacket at center and the dark blue jacket at center are fully visible in your photo. Which jacket should you focus on to avoid cropping the top of the taller one?" }, { "from": "gpt", "value": "The dark blue jacket at center is taller than the black matte jacket at center, so you should focus on ensuring the dark blue jacket at center is fully visible to avoid cropping the top." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c380a003c456dd1.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.506, 0.688) and point (0.377, 0.287), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.506, 0.688) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f99fb21a47f8e37.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of blue smooth shirt at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.507, 0.481)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4819cb23ae1b2f2f.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, yellow fabric costume at center or denim overalls at center?" }, { "from": "gpt", "value": "yellow fabric costume at center is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/447a67821d45904b.jpg", "conversations": [ { "from": "human", "value": "\nDoes black matte barbecue grill at center appear over brown curly fur dog at lower left?" }, { "from": "gpt", "value": "Correct, black matte barbecue grill at center is located above brown curly fur dog at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7c36c3907255082.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.118, 0.544) lie behind point (0.759, 0.655)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8dfc49b706a73ca3.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a black leather jacket at center. Pinpoint a point to the black leather jacket at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.350, 0.634)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/151a218e873ee6e4.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte helmet at center lie in front of white cotton shirt at lower right?" }, { "from": "gpt", "value": "Yes, white matte helmet at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/71b14ad5b4ef7428.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, brown beard at center or brown matte hair at center?" }, { "from": "gpt", "value": "brown matte hair at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dcba654904708068.jpg", "conversations": [ { "from": "human", "value": "\nIs metal chain-link fence at center shorter than green grass at lower center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca1091a0e58ef154.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.865, 0.642) or (0.295, 0.370)?" }, { "from": "gpt", "value": "Point (0.295, 0.370)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/115858733d377f69.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing next to the black matte jacket at lower left and want to take a photo of the metallic gray eiffel tower at center. If your camera has a maximum zoom range of 10 meters, will you be able to capture the entire eiffel tower in the photo without moving closer?" }, { "from": "gpt", "value": "The distance between the metallic gray eiffel tower at center and the black matte jacket at lower left is 36.42 meters. Since your camera can only zoom up to 10 meters, you won cannot capture the entire eiffel tower without moving closer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/24dd5c7250294344.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.367, 0.456) come in front of point (0.546, 0.077)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.546, 0.077)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf732177320f6e10.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.969, 0.864) less distant than point (0.704, 0.912)?" }, { "from": "gpt", "value": "No, it is behind (0.704, 0.912)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5a9f6953b72b8b7.jpg", "conversations": [ { "from": "human", "value": "\nPoint to matte black dress at center.Point to the matte black dress at center in the image." }, { "from": "gpt", "value": "[(0.056, 0.283)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/09861626a1cacc92.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker who wants to place your blue fabric backpack at right and dark brown leather pants at lower left in a way that they are both visible from the front. Which object should you place first to ensure visibility?" }, { "from": "gpt", "value": "The dark brown leather pants at lower left should be placed first because the blue fabric backpack at right is positioned on the right side of it, meaning the backpack is further to the right and would not block the pants if placed correctly." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d00ed084adbed0c8.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the beach and want to find the clear blue water at lower center. According to the scene, where should you look relative to your position?" }, { "from": "gpt", "value": "The clear blue water at lower center is located at point (0.530, 0.881), so you should look towards the lower center direction from your current position on the beach." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3141cdb512d6e15c.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery driver who needs to navigate around the construction area. You see the rusty metal road closed sign at center and the orange fabric barricade at lower left. Which object is located to the right of the other?" }, { "from": "gpt", "value": "The rusty metal road closed sign at center is positioned on the right side of orange fabric barricade at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c3653df20fb816b5.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the matte red bar stool at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.813, 0.786)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8511f2d71dbc5e47.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the blue glossy tongue at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.326, 0.611)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed9373b02450eb1a.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the edge of the gray water at center and want to walk to the nearest stone pier supporting the bridge. How far do you need to walk?" }, { "from": "gpt", "value": "The distance between the gray water at center and the viewer is 96.37 feet, so you need to walk 96.37 feet to reach the nearest stone pier supporting the bridge." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/becaeaa02f9e4069.jpg", "conversations": [ { "from": "human", "value": "\nIs gray cotton shirt at lower center wider than light blue t-shirt at center?" }, { "from": "gpt", "value": "In fact, gray cotton shirt at lower center might be narrower than light blue t-shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bad6b0f61f413f67.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.441, 0.234) come in front of point (0.949, 0.608)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/98ff4d3e4e911e9d.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of cherry wood podium at left. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.215, 0.725)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b957a4e4fc0d898.jpg", "conversations": [ { "from": "human", "value": "\nBetween bare branches at upper right and dark brown leather jacket at lower left, which one has less height?" }, { "from": "gpt", "value": "Standing shorter between the two is dark brown leather jacket at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/10c8f8ba84200928.jpg", "conversations": [ { "from": "human", "value": "\nLocate the black cotton t-shirt at center in the image." }, { "from": "gpt", "value": "[(0.736, 0.625)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a98773fd60f96669.jpg", "conversations": [ { "from": "human", "value": "\nLocate matte red shirt at center in the image." }, { "from": "gpt", "value": "[(0.472, 0.670)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/35df82cf360cc181.jpg", "conversations": [ { "from": "human", "value": "\nIs matte blue suit at left bigger than dark gray suit at left?" }, { "from": "gpt", "value": "Correct, matte blue suit at left is larger in size than dark gray suit at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/91c3fe5d3eb85e36.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is smooth concrete pavement at right from camera?" }, { "from": "gpt", "value": "smooth concrete pavement at right and camera are 4.16 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/59c1320f75b1cb0a.jpg", "conversations": [ { "from": "human", "value": "\nLocate brown matte hardwood at left in the image." }, { "from": "gpt", "value": "[(0.208, 0.711)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/52b333d4996de0a1.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, blue denim shorts at center or blue fabric shirt at right?" }, { "from": "gpt", "value": "blue fabric shirt at right is below." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff8594d0e730147c.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.723, 0.041) and point (0.072, 0.205), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.723, 0.041) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/862046f63f68d4ec.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, leather wristwatch at center or light brown fabric shirt at center?" }, { "from": "gpt", "value": "Standing taller between the two is light brown fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49c24a8ac4a14649.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the event and want to capture a candid shot of the man in the light gray suit. You notice the white silk tie at center and the matte black hand at center. Which object is closer to the camera in the image?" }, { "from": "gpt", "value": "The white silk tie at center is positioned over the matte black hand at center, so the white silk tie at center is closer to the camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/56f0cd99488e14c4.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the green leafy tree at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.217, 0.242)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23d60d6685be88fe.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the event and need to capture a photo where both the black satin tuxedo at center and the black lace dress at lower left are visible. Based on their positions, which one appears higher in the photo?" }, { "from": "gpt", "value": "The black satin tuxedo at center appears higher in the photo because it is positioned above the black lace dress at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/27452f216087cef3.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.075, 0.572) or point (0.465, 0.389)?" }, { "from": "gpt", "value": "Point (0.075, 0.572) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06c87db808ba2934.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position looking at the scene. There is a point marked at coordinates point (0.785, 0.922). How far is this point from where you are standing?" }, { "from": "gpt", "value": "The point (0.785, 0.922) is 7.36 meters away from the camera position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70733d2fc798a873.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer positioned at the edge of the equestrian arena. You want to capture a photo of the black leather jacket at center without the white wooden fence at lower center blocking the view. Is this possible given their positions?" }, { "from": "gpt", "value": "The black leather jacket at center is behind the white wooden fence at lower center, so the fence would block the view of the jacket. You cannot capture a clear photo of the black leather jacket at center without the fence obstructing it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d485f80251be469.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the brindle fur dog at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.755, 0.659)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0312462f3202e152.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the green evergreen tree at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.285, 0.309)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/33357d27edefae81.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.550, 0.980) come behind point (0.203, 0.056)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f383f40ff1bd877f.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, blue fabric shirt at center or matte blue shirt at left?" }, { "from": "gpt", "value": "blue fabric shirt at center is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3aa9299cb9ad8968.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown dirt path at lower right is positioned below green grass at center?" }, { "from": "gpt", "value": "Indeed, brown dirt path at lower right is positioned under green grass at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d16b220e6f17f87f.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, glossy ceramic platter at lower left or translucent glass bowl at upper left?" }, { "from": "gpt", "value": "translucent glass bowl at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c8b0453bb33dc122.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.523, 0.630)?" }, { "from": "gpt", "value": "matte gray tank top at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7a150f7618fa2dc8.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the right, green matte shirt at upper center or green matte shirt at right?" }, { "from": "gpt", "value": "Positioned to the right is green matte shirt at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0e3237dbb14ad56.jpg", "conversations": [ { "from": "human", "value": "\nYou are a museum visitor standing in front of the blue velvet robe at center. You want to take a photo of it without getting too close. If your camera has a maximum focus range of 2 meters, will you be able to capture a clear photo from your current position?" }, { "from": "gpt", "value": "The blue velvet robe at center is 1.92 meters away from the viewer. Since the camera can focus up to 2 meters, you can take a clear photo without moving closer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7c1e97cee3a0b03a.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of white fabric tent at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.368, 0.580)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e5216fd43a9a7a58.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, wooden slats at right or peach matte pillar at left?" }, { "from": "gpt", "value": "wooden slats at right is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/90da98633f6de72c.jpg", "conversations": [ { "from": "human", "value": "\nIs white smooth pillar at lower center to the left of yellow/yellowish paper at upper center from the viewer's perspective?" }, { "from": "gpt", "value": "Incorrect, white smooth pillar at lower center is not on the left side of yellow/yellowish paper at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/532f547068c3a326.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.163, 0.428)?" }, { "from": "gpt", "value": "brown wooden railing at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/28b7065fc204e728.jpg", "conversations": [ { "from": "human", "value": "\nYou are an artist planning to sketch the scene. You need to decide the size of your drawing paper. Based on the sizes of the bronze mickey mouse at center and the white shirt at lower left, which object should you allocate more space for on the paper?" }, { "from": "gpt", "value": "The bronze mickey mouse at center is smaller than the white shirt at lower left, so you should allocate more space for the white shirt at lower left on the paper since it is larger." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc9aae89ca315788.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance from maroon fleece jacket at center to matte gold helmet at upper center." }, { "from": "gpt", "value": "The distance of maroon fleece jacket at center from matte gold helmet at upper center is 3.50 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ca55485a0e6905f.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a group photo of the family. You notice the multicolored beaded dress at center and the purple floral dress at left. Which dress should you position closer to the camera to ensure both are visible in the frame?" }, { "from": "gpt", "value": "The purple floral dress at left should be positioned closer to the camera because the multicolored beaded dress at center is already to the right of it, so moving the left one forward would keep both in view." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf453bc4a0031f73.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.840, 0.783) or point (0.446, 0.389)?" }, { "from": "gpt", "value": "The point (0.446, 0.389) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d70cd11927b33a5.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.828, 0.839) or (0.168, 0.831)?" }, { "from": "gpt", "value": "The point (0.168, 0.831) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df4449036bcd9a9b.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position in the grand building. There is a point marked at coordinates point (0.324, 0.900). How far is that point from your current position?" }, { "from": "gpt", "value": "The point (0.324, 0.900) is 20.15 feet away from the camera position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/22a4c0e6a7561c2d.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a detailed shot of the smooth gray sweater at upper center and the smooth gray pants at center. Which object should you zoom in on to ensure it takes up more of the frame without moving the camera?" }, { "from": "gpt", "value": "The smooth gray sweater at upper center has a smaller size compared to smooth gray pants at center, so you should zoom in on the smooth gray pants at center to ensure it takes up more of the frame without moving the camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3bf6ae9c841ac9b8.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from point (0.780, 0.842) to camera." }, { "from": "gpt", "value": "31.47 inches" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c03c9697c7288f0e.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is beige leather armchair at lower right from transparent glass coffee table at center?" }, { "from": "gpt", "value": "A distance of 37.54 inches exists between beige leather armchair at lower right and transparent glass coffee table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b50fd7ec4fa8977e.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.464, 0.312) farther from viewer compared to point (0.510, 0.875)?" }, { "from": "gpt", "value": "Yes, point (0.464, 0.312) is farther from viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f73164bc0c4e680.jpg", "conversations": [ { "from": "human", "value": "\nHow close is worn fabric clothesline at center from smooth concrete pole at left?" }, { "from": "gpt", "value": "worn fabric clothesline at center is 5.26 meters from smooth concrete pole at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/918e7cab5c810c05.jpg", "conversations": [ { "from": "human", "value": "\nDoes black knit sweater at center appear on the right side of blue fabric poster at right?" }, { "from": "gpt", "value": "In fact, black knit sweater at center is to the left of blue fabric poster at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d2c98bc610257ba.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.067, 0.963) lie in front of point (0.052, 0.134)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.052, 0.134)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f125244914e2eda2.jpg", "conversations": [ { "from": "human", "value": "\nPoint to reflective fabric safety vest at center.Point to the reflective fabric safety vest at center in the image." }, { "from": "gpt", "value": "[(0.712, 0.630)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d5c2cc7a0ed5c8c.jpg", "conversations": [ { "from": "human", "value": "\nIs white fluffy snow at center closer to the viewer compared to green fabric shorts at center?" }, { "from": "gpt", "value": "Yes, white fluffy snow at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/300f0f3c5bfaee57.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green leafy tree at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.794, 0.328)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1845336219cff877.jpg", "conversations": [ { "from": "human", "value": "\nWhere is gold matte champagne bottle at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.244, 0.416)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/824187a86f40a1f8.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if plaid cotton shirt at left is thinner than white cotton shirt at center?" }, { "from": "gpt", "value": "Yes, plaid cotton shirt at left is thinner than white cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f3d87f2983d1f8dc.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the base of the cliff and want to reach the point marked at coordinates point (0.737, 0.895). How far do you need to travel to reach it?" }, { "from": "gpt", "value": "The point marked at coordinates point (0.737, 0.895) is 17.78 feet away from the viewer, so you need to travel 17.78 feet to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00ba78775b5b3f6c.jpg", "conversations": [ { "from": "human", "value": "\nBetween matte gray shirt at center and light brown leather jacket at upper left, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "light brown leather jacket at upper left is more to the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/263720df594e567a.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.619, 0.852)?" }, { "from": "gpt", "value": "plaid cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/62c4c08a2f6f5b94.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the lace fabric sweater at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.582, 0.623)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7922ee2734594c68.jpg", "conversations": [ { "from": "human", "value": "\nLocate the brown wooden skeleton at center in the image." }, { "from": "gpt", "value": "[(0.485, 0.784)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b913a6bffa7bca32.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from shiny red cloth at center to camera." }, { "from": "gpt", "value": "They are 8.39 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3442f2aebdb5128c.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked as point (0.516, 0.350) in the image. How far are you from the camera?" }, { "from": "gpt", "value": "The point marked as point (0.516, 0.350) is 5.35 meters away from the camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/230f07c220cfbd6b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at center is taller than black asphalt road at center?" }, { "from": "gpt", "value": "Yes, green leafy tree at center is taller than black asphalt road at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/63a6ff4cf1475f4b.jpg", "conversations": [ { "from": "human", "value": "\nBetween smooth concrete stairs at center and dark blue fabric jacket at lower center, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "smooth concrete stairs at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bdbe4a1a661e8da9.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the lace fabric dress at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.836, 0.556)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1501364fc484695f.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.783, 0.483) from camera?" }, { "from": "gpt", "value": "The distance of point (0.783, 0.483) from camera is 5.88 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e6d7b6dff777b045.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.585, 0.231) in front of point (0.392, 0.178)?" }, { "from": "gpt", "value": "No, it is behind (0.392, 0.178)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4dab6f25b6aaef5b.jpg", "conversations": [ { "from": "human", "value": "\nPoint to white fluffy cloud at upper center.Point to the white fluffy cloud at upper center in the image." }, { "from": "gpt", "value": "[(0.508, 0.291)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c156496e8a647a8c.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of the building and want to walk towards the gray concrete pavement at lower left. According to the image, in which direction should you move relative to your current position?" }, { "from": "gpt", "value": "The gray concrete pavement at lower left is located at point (0.191, 0.812), so you should move towards the lower left direction from your current position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4dd22580457b967.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the floral-patterned shirt at left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.219, 0.345)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/67b5a140f2a7f7c2.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up for a group photo. You need to ensure that both the green cotton sweater at center and the knitted navy cardigan at right are clearly visible in the frame. Based on their positions, which clothing item might be partially obscured if they move closer to each other?" }, { "from": "gpt", "value": "The knitted navy cardigan at right is behind the green cotton sweater at center, so if they move closer, the knitted navy cardigan at right might be partially obscured by the green cotton sweater at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bdcd7398a668abdb.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of matte red tank top at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.284, 0.562)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04599538692e0fb9.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.306, 0.848) or (0.654, 0.537)?" }, { "from": "gpt", "value": "Point (0.306, 0.848) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2baad558d6d04c0.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the brown leafy tree at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.106, 0.347)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4d025e82e924976.jpg", "conversations": [ { "from": "human", "value": "\nWhere is metallic grill cart at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.417, 0.683)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/72a8c9952ffb9f54.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is black leather earbud at upper right from matte skin ear at center?" }, { "from": "gpt", "value": "black leather earbud at upper right is 7.27 meters from matte skin ear at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f902edf371184222.jpg", "conversations": [ { "from": "human", "value": "\nDoes metallic blue bench at center have a greater height compared to metallic blue bench at right?" }, { "from": "gpt", "value": "Yes, metallic blue bench at center is taller than metallic blue bench at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f3b0519001dcee0e.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the beach and want to wade into the clear water at lower center. How far do you have to walk to reach it?" }, { "from": "gpt", "value": "The clear water at lower center is 143.43 feet away from the viewer, so you would need to walk approximately 143.43 feet to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/040ff9507de6998a.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, bare branches at left or green coniferous tree at upper right?" }, { "from": "gpt", "value": "green coniferous tree at upper right is above." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/960705858f2fbd77.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.793, 0.500) or (0.697, 0.769)?" }, { "from": "gpt", "value": "The point (0.697, 0.769) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/407110f8918b741a.jpg", "conversations": [ { "from": "human", "value": "\nLocate all dark gray metallic skeleton at center in the image." }, { "from": "gpt", "value": "[(0.666, 0.534)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/160c2e20e9118a1a.jpg", "conversations": [ { "from": "human", "value": "\nBetween matte white dress at center and smooth skin at center, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "matte white dress at center is more to the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e837d40265985e9a.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any striped sweater at right in the image." }, { "from": "gpt", "value": "[(0.938, 0.677)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce345b44b8e0ddd5.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the base of the castle walls and want to reach a specific point marked at coordinates point (0.362, 0.978). How far is this point from your current position?" }, { "from": "gpt", "value": "The distance of point (0.362, 0.978) from camera is 41.06 meters, so the point is 41.06 meters away from your current position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab947df94f5036ba.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, green fabric mask at center or green matte hair at center?" }, { "from": "gpt", "value": "From the viewer's perspective, green fabric mask at center appears more on the right side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc67cf41c9373265.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of black matte tank top at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.474, 0.634)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7dcb92de267d1ac.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.149, 0.306) and point (0.321, 0.886), which one is positioned behind?" }, { "from": "gpt", "value": "Positioned behind is point (0.149, 0.306)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dce8cbb1691c694f.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing on the beach looking at the white matte sailboat at center and the clear water at center. Which object is closer to the camera?" }, { "from": "gpt", "value": "The white matte sailboat at center is above clear water at center, so it is closer to the camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4daae63a6869e0e1.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing outside the hot tub and want to hand a towel to the person with blonde hair at right. Which direction should you move relative to the foamy white bath at center?" }, { "from": "gpt", "value": "You should move to the right of the foamy white bath at center to reach the blonde hair at right, since the blonde hair at right is located to the right of the foamy white bath at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec072ba7e42f1d88.jpg", "conversations": [ { "from": "human", "value": "\nIs white synthetic wig at center taller than smooth white wig at center?" }, { "from": "gpt", "value": "Yes, white synthetic wig at center is taller than smooth white wig at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0f0b9ed75a0d21b.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the hotel lobby and want to approach the reception desk. If your current position is at the point marked by coordinates point (0.066, 0.498), how far do you need to walk to reach the reception desk?" }, { "from": "gpt", "value": "You need to walk 3.87 meters to reach the reception desk because the point (0.066, 0.498) is 3.87 meters away from the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c403f3d3812870c7.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.247, 0.530) come closer to viewer compared to point (0.739, 0.528)?" }, { "from": "gpt", "value": "Yes, point (0.247, 0.530) is in front of point (0.739, 0.528)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0672908ded611de.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.953, 0.634) positioned behind point (0.998, 0.570)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1eac7f78a201cc5b.jpg", "conversations": [ { "from": "human", "value": "\nIs polished bronze horse at lower left above polished white pole at center?" }, { "from": "gpt", "value": "Actually, polished bronze horse at lower left is below polished white pole at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/79ddc16945b7950d.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.165, 0.322) and point (0.896, 0.923), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.896, 0.923) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4d89e3763eb065e8.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.615, 0.517) or point (0.223, 0.478)?" }, { "from": "gpt", "value": "Point (0.223, 0.478)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef49b0525ef30299.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the camera position. You want to take a photo of the green patinated bronze chariot at upper right. How far do you need to move forward or backward to get the chariot into the center of your photo?" }, { "from": "gpt", "value": "The green patinated bronze chariot at upper right is 96.60 meters from the camera. To center it in the photo, you would need to move forward or backward to adjust the framing, but the exact distance adjustment depends on the camera lens and desired composition. However, the chariot is already positioned at the upper right in the scene, so moving closer might bring it into the center while maintaining the monument structure in view." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/84c247e776acaf32.jpg", "conversations": [ { "from": "human", "value": "\nLocate all faded denim jacket at lower right in the image." }, { "from": "gpt", "value": "[(0.088, 0.769)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04886579947a80c2.jpg", "conversations": [ { "from": "human", "value": "\nWhere is translucent orange and white butterfly at center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.685, 0.502)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5fe17c2ff2e2983.jpg", "conversations": [ { "from": "human", "value": "\nPoint to green matte apple at left.Point to the green matte apple at left in the image." }, { "from": "gpt", "value": "[(0.179, 0.592)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fcd214ed475e3f53.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the dark blue water at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.640, 0.778)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e4276c9c04ebafd.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is camouflagetextured fabric at left from black plastic goggles at upper left?" }, { "from": "gpt", "value": "A distance of 11.60 inches exists between camouflagetextured fabric at left and black plastic goggles at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba6c72f17f9d7cbe.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, reddish-orange hoodie at center or green matte jacket at center?" }, { "from": "gpt", "value": "reddish-orange hoodie at center is more to the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/64ecb6fab9d383f8.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the edge of the gathering area and want to hand a drink to both the light blue shirt at center and the matte blue shirt at center. If you can only carry one drink at a time, which person should you approach first to minimize the total distance walked?" }, { "from": "gpt", "value": "You should approach the light blue shirt at center first because it is closer to you than the matte blue shirt at center, so the total distance walked will be minimized." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6af22102f2db4a78.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.478, 0.642) or (0.459, 0.716)?" }, { "from": "gpt", "value": "Point (0.478, 0.642)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b4db98e11d7e24c.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the point with coordinates (0.473, 0.828) in the image. What is the nearest object to you in the scene?" }, { "from": "gpt", "value": "The nearest object to you at point (0.473, 0.828) is the blue cotton shirt at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/695d6928f8f405c7.jpg", "conversations": [ { "from": "human", "value": "\nYou are an architect designing a new park layout. You need to place a new sculpture that is 3 meters tall. The park already has the black matte ship at center and the silhouette bronze statue at center. Considering their sizes, which existing object should the new sculpture be placed closer to to maintain visual balance?" }, { "from": "gpt", "value": "The new sculpture should be placed closer to the silhouette bronze statue at center because the black matte ship at center is larger in size than the silhouette bronze statue at center, so balancing with a smaller object would help maintain visual harmony." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/51fe985d69b9be49.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person who needs to park your 1.8 meters tall package next to the wooden panel car at center and the metallic silver car at left. Which car should you place the package next to so it doesn" }, { "from": "gpt", "value": "The wooden panel car at center has a greater height compared to the metallic silver car at left. Therefore, you should place the package next to the wooden panel car at center since its height matches the package." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b74341a0bc11077c.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, white plastic lamp post at upper center or galvanized metal pole at center?" }, { "from": "gpt", "value": "galvanized metal pole at center is below." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b1d5ef7559a4006.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.591, 0.845) less distant than point (0.841, 0.689)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.841, 0.689)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c165da46fade675a.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the wooden gate and want to take a photo of both horses. Which point should you focus on first to ensure both are in focus? The options are point A at coordinates point(0.062, 0.606) and point B at coordinates point(0.621, 0.505)." }, { "from": "gpt", "value": "Point A at coordinates point(0.062, 0.606) is closer to the camera than point B at coordinates point(0.621, 0.505). To ensure both are in focus, you should focus on the closer point first, which is point A." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e3d8de2681a8ea64.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the rural outdoor scene and want to reach the rusty brown truck at left. How far do you need to walk to get there?" }, { "from": "gpt", "value": "The rusty brown truck at left is 4.02 meters away from you, so you need to walk 4.02 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/676efbd30b6ffdf0.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white plastic table at center is shorter than metallic folding chair at center?" }, { "from": "gpt", "value": "Yes, white plastic table at center is shorter than metallic folding chair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70bd2431f91d2c1c.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, matte black jacket at center or suede jacket at center?" }, { "from": "gpt", "value": "suede jacket at center is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d52329c8803f1098.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if metallic silver chairs at center is shorter than dark brown leather jacket at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7d37b3d4ede082b7.jpg", "conversations": [ { "from": "human", "value": "\nYou are an architect examining the historic building. You need to determine if the white stone staircase at center can accommodate a large sculpture that requires a minimum width of 3 meters. Given that the smooth stone pillar at center is 2 meters wide, can the staircase potentially fit the sculpture?" }, { "from": "gpt", "value": "The white stone staircase at center might be wider than the smooth stone pillar at center, which is 2 meters wide. Therefore, it is possible that the staircase could accommodate the sculpture requiring 3 meters width, but further measurement is needed to confirm." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00627a11149243a2.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if clear water at center is bigger than metallic blue cargo ship at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d71dce9b96abf957.jpg", "conversations": [ { "from": "human", "value": "\nWhere is matte green dress at center located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.542, 0.520)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/184cfb66b303b86a.jpg", "conversations": [ { "from": "human", "value": "\nLocate green marble table at center in the image." }, { "from": "gpt", "value": "[(0.234, 0.323)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8ed23199e2a99c3.jpg", "conversations": [ { "from": "human", "value": "\nWho is taller, blue textured dress at center or white cotton shorts at lower right?" }, { "from": "gpt", "value": "Standing taller between the two is blue textured dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0690d063bc559ec7.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.406, 0.122) positioned in front of point (0.132, 0.220)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/950d2a030a548404.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of brown paper bulletin board at center from blue striped shirt at center?" }, { "from": "gpt", "value": "brown paper bulletin board at center is 25.42 inches from blue striped shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/018d3b8f75ec8e49.jpg", "conversations": [ { "from": "human", "value": "\nDoes golden brown croissant at center have a smaller size compared to black poppy seed bagel at right?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d624c600a08379e.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to black sweater at center? Please provide its 2D coordinates.Where can I find black sweater at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.258, 0.497)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3edb6721287b8140.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the asphalt parking lot at lower center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.475, 0.842)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46334d0b99dfa6e6.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.411, 0.308) lie behind point (0.631, 0.648)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6dbb8835efd203a4.jpg", "conversations": [ { "from": "human", "value": "\nBetween black beaded necklace at center and clear plastic glasses at center, which one is positioned lower?" }, { "from": "gpt", "value": "black beaded necklace at center is below." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0573aa166944ce2f.jpg", "conversations": [ { "from": "human", "value": "\nYou are a ski equipment inspector checking the gear of a skier. You notice the shiny metallic ski at center and the purple matte ski goggles at center. Which item is shorter in height?" }, { "from": "gpt", "value": "The shiny metallic ski at center is not as tall as the purple matte ski goggles at center, so the shiny metallic ski at center is shorter in height." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c45dc1be6558f54.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.350, 0.686)?" }, { "from": "gpt", "value": "translucent brown water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9aa671fbd5d2c913.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of white matte sculpture at left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.240, 0.609)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/97ac6d2b86397488.jpg", "conversations": [ { "from": "human", "value": "\nLocate green leafy tree at upper right in the image." }, { "from": "gpt", "value": "[(0.834, 0.192)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aa99170a1eb9bc0b.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.257, 0.544)?" }, { "from": "gpt", "value": "black metal window at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/926457ac3b70afad.jpg", "conversations": [ { "from": "human", "value": "\nYou are an observer standing in front of the scene. You notice the red velvet santa hat at upper left and the matte purple jacket at center. Which object is shorter in height?" }, { "from": "gpt", "value": "The red velvet santa hat at upper left has a lesser height compared to the matte purple jacket at center, so the red velvet santa hat at upper left is shorter in height." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a115f34dcd8b179b.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte shirt at lower left shorter than green matte shirt at right?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/250188f8d82d5d29.jpg", "conversations": [ { "from": "human", "value": "\nWhat is at (0.525, 0.856)?" }, { "from": "gpt", "value": "stone paved path at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e879aecedef5f1c.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of neon green shorts at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.377, 0.544)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7723b17770812485.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.074, 0.858) positioned behind point (0.365, 0.705)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/449fbdb61afd367e.jpg", "conversations": [ { "from": "human", "value": "\nLocate gray suit at center in the image." }, { "from": "gpt", "value": "[(0.785, 0.673)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/18c815ef119ff9ab.jpg", "conversations": [ { "from": "human", "value": "\nYou are setting up a table for a dinner party and need to place a 15 cm tall candle holder between the transparent glass wine glass at center and the silver metallic spoon at lower left. Can the candle holder fit vertically between them without touching either object?" }, { "from": "gpt", "value": "The transparent glass wine glass at center is taller than the silver metallic spoon at lower left. Since the candle holder is 15 cm tall, it can fit vertically between them as long as there is enough horizontal space between the two objects to accommodate its base without touching either." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/15d59650799a0910.jpg", "conversations": [ { "from": "human", "value": "\nYou are a parent trying to distract your baby. You see the denim overalls at center and the green plush toy at center. Which object is positioned to the right side?" }, { "from": "gpt", "value": "The denim overalls at center is to the right of the green plush toy at center, so the denim overalls at center is positioned to the right side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/12594b1138961a19.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between green grassy field at center and camera?" }, { "from": "gpt", "value": "4.50 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8007ecf8875537a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy hillside at upper center is positioned to the right of white glossy boat at center?" }, { "from": "gpt", "value": "No, green leafy hillside at upper center is not to the right of white glossy boat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7470503947ba3372.jpg", "conversations": [ { "from": "human", "value": "\nHow distant is denim jacket at center from matte black jacket at lower left?" }, { "from": "gpt", "value": "denim jacket at center is 5.86 meters away from matte black jacket at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a032b3035613649.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny black table at center above black woven chair at center?" }, { "from": "gpt", "value": "Correct, shiny black table at center is located above black woven chair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c43dec7c0269c5b7.jpg", "conversations": [ { "from": "human", "value": "\nIs green matte bench at center positioned in front of smooth concrete pavement at center?" }, { "from": "gpt", "value": "Yes, green matte bench at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a1253aafe4ec7d7e.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the metallic glass tower at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.937, 0.361)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce72257e02371b3a.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, yellow larch tree at center or green matte tree at left, stands taller?" }, { "from": "gpt", "value": "green matte tree at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c6fcf77b1380a07.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.349, 0.092) or point (0.583, 0.508)?" }, { "from": "gpt", "value": "Positioned behind is point (0.583, 0.508)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5431c79147faac03.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery driver who needs to park your matte blue truck at center without covering the blue matte signboard at center. According to the scene, is this possible?" }, { "from": "gpt", "value": "The matte blue truck at center is positioned over blue matte signboard at center, so it is currently covering the signboard. To park without covering it, the truck must be moved to a different location where it doesn not overlap the signboard." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d1e12da90ab76ee.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the edge of the sidewalk, and you want to take a photo of the matte green bicycle at center. The camera you are using has a minimum focusing distance of 1.5 meters. Will the bicycle be in focus?" }, { "from": "gpt", "value": "The matte green bicycle at center is 1.64 meters away from camera, which is beyond the camera minimum focusing distance of 1.5 meters. Therefore, the bicycle will be in focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c387011075f37fb.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a white stone clock tower at upper center. Pinpoint a point to the white stone clock tower at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.703, 0.670)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f5afde48693b256.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the beach and see the floral cotton skirt at upper right. How far away is it from you?" }, { "from": "gpt", "value": "The floral cotton skirt at upper right is 7.64 meters away from the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c0131dd1e1227dd.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the natural wood planter at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.529, 0.561)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc1e80ad25c44329.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.426, 0.778)?" }, { "from": "gpt", "value": "brown soil at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/885e5d3a3ecef90a.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of pink blossoms at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.743, 0.819)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/75ce249f23b88360.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.532, 0.566) or point (0.823, 0.548)?" }, { "from": "gpt", "value": "Point (0.823, 0.548) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ecee0e5cb704525e.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any dark brown hair at upper left in the image." }, { "from": "gpt", "value": "[(0.228, 0.542)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f06eed0bbd99ada8.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of gray woolen sweater at right. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.926, 0.728)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/187a782a582c4d77.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing a charity event and need to decide which outfit to wear. You have a white satin tank top at center and a matte black dress at center. Based on their widths, which one would you choose if you want an outfit that is wider?" }, { "from": "gpt", "value": "The matte black dress at center is wider than the white satin tank top at center, so you should choose the matte black dress at center if you want a wider outfit." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db52f79948d94689.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.152, 0.427) or (0.914, 0.408)?" }, { "from": "gpt", "value": "Point (0.914, 0.408) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/882ec4c8e03d4ae7.jpg", "conversations": [ { "from": "human", "value": "\nYou are an architect analyzing the historical site. You notice the cloudy sky at upper center and the brown wooden fence at lower left. Which object occupies a larger horizontal space in the image?" }, { "from": "gpt", "value": "The cloudy sky at upper center might be wider than the brown wooden fence at lower left according to the description." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c5c4cd5ad24a5a4d.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up for a portrait session. You need to ensure that the black matte blazer at center and the white cloth at left are positioned so that the blazer is centered in the frame while the white cloth remains out of the main shot. Given their current positions, is this arrangement possible?" }, { "from": "gpt", "value": "The black matte blazer at center is to the right of the white cloth at left. Since the blazer is already positioned to the right of the white cloth, moving the blazer further to the center would require shifting it leftward, which might bring the white cloth into the frame. Therefore, achieving the desired arrangement may not be possible without adjusting the white cloth." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05c249011938631c.jpg", "conversations": [ { "from": "human", "value": "\nIs green fabric jacket at center above light brown leather jacket at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d3475121736e71b2.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.660, 0.873) from camera?" }, { "from": "gpt", "value": "107.16 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf033df92c6a4eaf.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the leather skirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.301, 0.480)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/09bb1f8c3bcbc4a2.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person trying to park a truck that is 2 meters wide. You see a matte red car at lower left and a yellow matte car at lower left. Can you determine if there is enough space between them to park your truck?" }, { "from": "gpt", "value": "The matte red car at lower left might be wider than yellow matte car at lower left, so it is uncertain if there is enough space between them to park a 2 meter wide truck. Check the actual width before deciding." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05dd654b807985b0.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of brown and white fur goat at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.509, 0.334)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d2614c29b97b0d5d.jpg", "conversations": [ { "from": "human", "value": "\nIs blue fabric flag at right bigger than matte black suit at center?" }, { "from": "gpt", "value": "Actually, blue fabric flag at right might be smaller than matte black suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/213d97518944ebc1.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a white plastic toy car at lower center. Pinpoint a point to the white plastic toy car at lower center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.402, 0.611)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5fa7a457b3d1ab7.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte church at center positioned at the back of green matte spire at upper center?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c8e71ca621c105c6.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.740, 0.450) farther from camera compared to point (0.474, 0.673)?" }, { "from": "gpt", "value": "No, it is in front of (0.474, 0.673)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c170173c547d6b16.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.873, 0.592) or point (0.407, 0.883)?" }, { "from": "gpt", "value": "Point (0.407, 0.883) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36d0014227ebafac.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of dark blue fabric at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.500, 0.756)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b52a5fe1c6ff758c.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.931, 0.648) farther from camera compared to point (0.581, 0.500)?" }, { "from": "gpt", "value": "No, it is in front of (0.581, 0.500)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d110ebb651e978d.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the silver metallic car at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.480, 0.863)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/61b84c19def94702.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of plaid woolen jacket at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.294, 0.411)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c0832e018552847.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of brown textured tree at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.531, 0.266)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4947c6036bf75f18.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between rubberized red track at center and white fabric banner at upper center." }, { "from": "gpt", "value": "They are 23.03 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6153f9f9e7d31768.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.679, 0.902) come farther from viewer compared to point (0.465, 0.530)?" }, { "from": "gpt", "value": "Yes, it is behind point (0.465, 0.530)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86a0057df2be606e.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the bare branches at upper right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.900, 0.434)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ddaf3723ddff5bfe.jpg", "conversations": [ { "from": "human", "value": "\nLocate white plastic arrow at left in the image." }, { "from": "gpt", "value": "[(0.185, 0.328)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5922aa4fb0212d8f.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gold satin curtain at upper center is positioned to the left of translucent glass window at center?" }, { "from": "gpt", "value": "Indeed, gold satin curtain at upper center is positioned on the left side of translucent glass window at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b45985111ea9d917.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a blue satin tablecloth at center. Pinpoint a point to the blue satin tablecloth at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.911, 0.978)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0351a0f6f75c911.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green grass at center is wider than blue fleece sweatshirt at center?" }, { "from": "gpt", "value": "Indeed, green grass at center has a greater width compared to blue fleece sweatshirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/934b1b8999ca07fc.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a group photo of the blue striped shirt at right and the striped shirt at center. The camera you are using has a minimum focus distance of 50 centimeters. Will you be able to take the photo without moving any of the subjects?" }, { "from": "gpt", "value": "The blue striped shirt at right and the striped shirt at center are 47.04 centimeters apart. Since the minimum focus distance is 50 centimeters, the camera cannot focus properly. Therefore, you need to move the subjects closer to the camera or have them move slightly apart to meet the minimum distance requirement." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46596c36f6897e9d.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.124, 0.567) behind point (0.660, 0.733)?" }, { "from": "gpt", "value": "No, (0.124, 0.567) is in front of (0.660, 0.733)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/33bdc7f22091570a.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.683, 0.250) come behind point (0.566, 0.655)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4573557c956f040.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.534, 0.973) behind point (0.292, 0.878)?" }, { "from": "gpt", "value": "No, it is in front of (0.292, 0.878)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b13bb9da393526f.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.997, 0.959) in front of point (0.438, 0.064)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.438, 0.064)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5de5e52c4d46ae06.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.968, 0.484) closer to viewer compared to point (0.429, 0.205)?" }, { "from": "gpt", "value": "No, (0.968, 0.484) is behind (0.429, 0.205)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5f848a1ffa344809.jpg", "conversations": [ { "from": "human", "value": "\nBetween white smooth piglet at lower right and white smooth piglet at lower center, which one has more height?" }, { "from": "gpt", "value": "Standing taller between the two is white smooth piglet at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/39f513c69b13cd86.jpg", "conversations": [ { "from": "human", "value": "\nCould you measure the distance between white fur cat at left and orange tabby cat at center?" }, { "from": "gpt", "value": "white fur cat at left is 25.35 inches from orange tabby cat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8316919431e01381.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the center of the mountain landscape and want to locate the cloudy sky at upper center. According to the coordinates provided, where exactly would you look?" }, { "from": "gpt", "value": "The cloudy sky at upper center is located at coordinates point (0.500, 0.244)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef52af43fd4d494f.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of floral silk kimono at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.390, 0.752)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4d9c11d47bcd6a57.jpg", "conversations": [ { "from": "human", "value": "\nYou are a fashion designer observing the scene. You need to determine which clothing item is shorter between the matte white sweater at center and the matte gray shirt at upper left. Which one is shorter?" }, { "from": "gpt", "value": "The matte white sweater at center is shorter than the matte gray shirt at upper left according to the description." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e45154bfb4caef10.jpg", "conversations": [ { "from": "human", "value": "\nBetween light blue dotted tie at right and red woven tie at center, which one is positioned lower?" }, { "from": "gpt", "value": "light blue dotted tie at right is below." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc5d5b76a4d80bd6.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.801, 0.534) and point (0.156, 0.934), which one is positioned behind?" }, { "from": "gpt", "value": "Point (0.156, 0.934)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/af5fea7f489a5ebf.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.522, 0.514) lie in front of point (0.530, 0.459)?" }, { "from": "gpt", "value": "No, it is behind (0.530, 0.459)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a67a37151b1a75c8.jpg", "conversations": [ { "from": "human", "value": "\nLocate all white matte bus at center in the image." }, { "from": "gpt", "value": "[(0.275, 0.403)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bfcf8abbd468f376.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the white fleece sweatshirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.362, 0.608)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/61d6f97a5014c192.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the brown woolen coat at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.622, 0.527)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/21301c8e611c60a1.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of green grass field at center in the image." }, { "from": "gpt", "value": "[(0.474, 0.572)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d0b36fd9bdd79b4.jpg", "conversations": [ { "from": "human", "value": "\nYou are a barista who needs to place a new cup on the wooden surface. The existing cup is on the saucer marked by point (0.705, 0.419). Where should you place the new cup to ensure it is not too close to the keyboard?" }, { "from": "gpt", "value": "Place the new cup on the wooden surface away from the white ceramic saucer at right marked by point (0.705, 0.419) to avoid proximity to the keyboard." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/108cbf856668490a.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.781, 0.497) positioned after point (0.494, 0.844)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a10fb71ade9b11c.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and want to throw a small pebble to hit the point at coordinates (0.330, 0.569). How far do you need to throw it?" }, { "from": "gpt", "value": "The point at coordinates (0.330, 0.569) is 8.11 meters away from the camera, so you need to throw the pebble 8.11 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2622e8775555d77d.jpg", "conversations": [ { "from": "human", "value": "\nWho is higher up, smooth tan skin at center or brown wooden person at center?" }, { "from": "gpt", "value": "smooth tan skin at center is above." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e428d633c07f5648.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery person who needs to place a package that is 2 meters long between the floral fabric ottoman at lower right and the matte wooden picture frame at upper center. Is there enough space to fit the package horizontally between these two objects?" }, { "from": "gpt", "value": "The distance between the floral fabric ottoman at lower right and the matte wooden picture frame at upper center is 3.58 meters. Since the package is 2 meters long, there is sufficient space to fit it horizontally between these two objects." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d06c0622c7e6f74e.jpg", "conversations": [ { "from": "human", "value": "\nYou are observing two points in the image. The first point is labeled as point (0.141, 0.916) and the second is point (0.041, 0.203). Based on their positions, which point is closer to the foreground of the scene?" }, { "from": "gpt", "value": "Point (0.041, 0.203) is closer to the foreground because it is in front of point (0.141, 0.916)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3969ceb261cd8f08.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.181, 0.938) or (0.071, 0.570)?" }, { "from": "gpt", "value": "Point (0.181, 0.938)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03e6151235c4becf.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a green leafy tree at upper center. Pinpoint a point to the green leafy tree at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.612, 0.322)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/773ef023c6cb4f2e.jpg", "conversations": [ { "from": "human", "value": "\nYou are a security guard in the museum and need to ensure that visitors maintain a minimum distance of 6 feet apart for safety. You observe the gray pinstripe suit at left and dark gray suit at right. Are they complying with the social distancing guidelines?" }, { "from": "gpt", "value": "The distance between the gray pinstripe suit at left and dark gray suit at right is 8.45 feet, which exceeds the required 6 feet minimum distance. Therefore, they are complying with the social distancing guidelines." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5567b6cf713d56c.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, smooth skin face at center or silver metallic earring at lower left?" }, { "from": "gpt", "value": "smooth skin face at center is more to the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0de0326acff1cae.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the black asphalt road at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.411, 0.878)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6aacaa91b500c9b4.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, brown glass bottle at center or amber glass at center?" }, { "from": "gpt", "value": "brown glass bottle at center is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e5cf4359591dc43d.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the matte plastic cup at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.231, 0.562)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b843496e52f24d5d.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer aiming to capture the satin blue heron at center in the image. Since you want to focus on the bird, you need to adjust your camera settings to ensure the clear water at center doesn not overpower the heron. Based on their sizes, which object should you prioritize in your composition?" }, { "from": "gpt", "value": "The clear water at center is bigger than the satin blue heron at center, so you should prioritize focusing on the satin blue heron at center to ensure it remains the main subject despite its smaller size." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16c772410132c8a7.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the yellow fabric shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.927, 0.756)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f8ae281b112ec07.jpg", "conversations": [ { "from": "human", "value": "\nBetween dark brown leather jacket at upper center and light brown hair at upper center, which one is positioned higher?" }, { "from": "gpt", "value": "Positioned higher is dark brown leather jacket at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e180048fb91135b.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the denim skirt at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.700, 0.639)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/97e456d49d37a77d.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black snowmobile at center closer to camera compared to shiny blue snowmobile at center?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4b6c3cf34383d24b.jpg", "conversations": [ { "from": "human", "value": "\nHow close is black puffer jacket at right from camera?" }, { "from": "gpt", "value": "black puffer jacket at right is 14.91 feet away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86810fb7aaf92636.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of white matte hard hat at lower center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.787, 0.669)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/80ed440eb18fbc4b.jpg", "conversations": [ { "from": "human", "value": "\nIs white fabric banner at center smaller than white plastic pole at upper center?" }, { "from": "gpt", "value": "Correct, white fabric banner at center occupies less space than white plastic pole at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fd59825a10cabc3d.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.359, 0.597) or point (0.706, 0.578)?" }, { "from": "gpt", "value": "Point (0.706, 0.578) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/061f3798302d24c6.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.695, 0.870) or point (0.138, 0.986)?" }, { "from": "gpt", "value": "Point (0.138, 0.986)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/da7326fcd4fa6b71.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of gray fleece hoodie at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.637, 0.817)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/599deaa058a55524.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between gray matte whale at center and camera?" }, { "from": "gpt", "value": "They are 25.15 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9e058b2ed720eff9.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.453, 0.730)?" }, { "from": "gpt", "value": "wooden at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bfd5d299a57e5d7d.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between shiny metallic ferris wheel at right and camouflage shorts at lower left." }, { "from": "gpt", "value": "shiny metallic ferris wheel at right and camouflage shorts at lower left are 271.69 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/51ec221aeb932ea6.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from white cotton tank top at center to camera." }, { "from": "gpt", "value": "They are 1.85 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eaddcb75fcf95fe8.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.707, 0.397) and camera?" }, { "from": "gpt", "value": "Point (0.707, 0.397) is 109.34 meters from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b78c600d0f9006b.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.460, 0.880) and point (0.965, 0.280), which one is positioned behind?" }, { "from": "gpt", "value": "Positioned behind is point (0.460, 0.880)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/30ff0450ca444bba.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of the venue and want to locate the performer wearing the black matte shirt at center. According to the coordinates provided, where should you look to find them?" }, { "from": "gpt", "value": "The performer wearing the black matte shirt at center is located at the coordinates point (0.510, 0.438), so you should look towards the center of the image slightly to the right and lower middle area." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d3ffd44527772abb.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of brown fur bear at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.497, 0.652)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5fcef7f7e48c69c2.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of translucent glass at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.285, 0.838)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d69b10a40df3d947.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if snowy granite mountains at upper center is taller than shiny metallic bicycle at center?" }, { "from": "gpt", "value": "Yes, snowy granite mountains at upper center is taller than shiny metallic bicycle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78e0c1cafe6c7806.jpg", "conversations": [ { "from": "human", "value": "\nLocate the brown cobblestone path at center in the image." }, { "from": "gpt", "value": "[(0.732, 0.866)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ee63782e2ff2ebbd.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery driver needing to pass through the traffic jam. You see a white glossy car at center and a matte black suv at left. Which vehicle should you avoid if you want to choose the narrower path between them?" }, { "from": "gpt", "value": "You should avoid the white glossy car at center because its width surpasses the matte black suv at left, making the path between them narrower than the path next to the suv." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a2a818c0532f72f.jpg", "conversations": [ { "from": "human", "value": "\nYou are a designer working on a mobile app that requires precise placement of icons. You need to ensure that the distance between the matte black android at center and the green matte android head at upper center in the design matches the original reference image. What is the exact distance between them?" }, { "from": "gpt", "value": "The exact distance between the matte black android at center and the green matte android head at upper center is 3.56 inches, so you should maintain that distance in your design to match the reference image." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/521904e08519e4df.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.094, 0.839) lie in front of point (0.747, 0.330)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/af2bbd4cbaa8748f.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of white tile wall at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.713, 0.680)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f2eb57b573a195c9.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of natural wood table at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.709, 0.845)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eee2a76ea4899461.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of green mossy rock at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.791, 0.761)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/48c12ad92afaaa44.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between green grass at center and camera?" }, { "from": "gpt", "value": "green grass at center is 4.50 meters away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/45a75b6e8ae4d426.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.781, 0.963) lie behind point (0.342, 0.236)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8711ed6e967aa507.jpg", "conversations": [ { "from": "human", "value": "\nWhat do you see at coordinate (0.316, 0.548)?" }, { "from": "gpt", "value": "floral silk kimono at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/97d117646b5cdc16.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of mahogany glossy table at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.862, 0.416)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/761a62b7a7cda625.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, green grass at center or green textured pine tree at center?" }, { "from": "gpt", "value": "green grass at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2a279b0815f02aa3.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the metallic silver table at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.529, 0.814)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/40948edd7bf54217.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of dark gray suit at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.757, 0.583)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f0111c76ae6cb298.jpg", "conversations": [ { "from": "human", "value": "\nDescribe the object at (0.504, 0.692)." }, { "from": "gpt", "value": "satin black gown at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ddea7b0c76bb8c6d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at left is taller than white glossy clock at upper center?" }, { "from": "gpt", "value": "Indeed, green leafy tree at left has a greater height compared to white glossy clock at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b01a6e611245b68.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of wooden at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.582, 0.481)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6de9e686fc1a4fef.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, black matte steam engine at center or dark gray suit at center, stands taller?" }, { "from": "gpt", "value": "black matte steam engine at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b86f786276359f6c.jpg", "conversations": [ { "from": "human", "value": "\nIs white metallic clock at upper center closer to camera compared to white stone spire at center?" }, { "from": "gpt", "value": "Yes, white metallic clock at upper center is in front of white stone spire at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7c3a0168b324ccab.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.163, 0.766)?" }, { "from": "gpt", "value": "matte black dress at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/358670193cceb586.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.910, 0.514) positioned in front of point (0.015, 0.970)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5076e4dc360c175e.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of point (0.069, 0.748) from camera?" }, { "from": "gpt", "value": "Point (0.069, 0.748) and camera are 5.78 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7bc00015c385e4b.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.491, 0.823)?" }, { "from": "gpt", "value": "brown rocky dirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f0cb964dedb4079.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.619, 0.950) or point (0.862, 0.869)?" }, { "from": "gpt", "value": "Point (0.862, 0.869)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/998977de558573e1.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, dark brown brick chimney at center or black glass lamp post at lower left?" }, { "from": "gpt", "value": "black glass lamp post at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d7611dd726827280.jpg", "conversations": [ { "from": "human", "value": "\nYou are a customer observing the scene in the bakery. You notice the white fabric apron at center and the smooth white dough at lower left. Which object is taller?" }, { "from": "gpt", "value": "The white fabric apron at center is taller than the smooth white dough at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/381efccbe042a09e.jpg", "conversations": [ { "from": "human", "value": "\nYou are a student in the classroom and want to reach both the point at coordinates (0.919, 0.778) and the point at coordinates (0.092, 0.072). Which point should you walk towards first to reach the closer one first?" }, { "from": "gpt", "value": "You should walk towards point (0.919, 0.778) first because it is closer to you than point (0.092, 0.072)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5569e44c6eeaf3d7.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.767, 0.244) or point (0.809, 0.873)?" }, { "from": "gpt", "value": "Point (0.809, 0.873) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/249eda9872e4e61c.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.175, 0.548) or point (0.743, 0.670)?" }, { "from": "gpt", "value": "The point (0.743, 0.670) is behind." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88a5b3f2fadf04e7.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of red paper banner at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.852, 0.541)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a7ee94bfaa3593d.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of polished brass handle at left in the image." }, { "from": "gpt", "value": "[(0.231, 0.503)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/713dee1843b1a163.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of leopard print blouse at left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.170, 0.681)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2dfed81cba9b2de8.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, white matte suit at center or matte black suit at upper left?" }, { "from": "gpt", "value": "matte black suit at upper left is more to the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7887baddad126bea.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.900, 0.666) and point (0.056, 0.739), which one is positioned behind?" }, { "from": "gpt", "value": "Positioned behind is point (0.900, 0.666)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc48c88ad90f8dd2.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.927, 0.816) positioned before point (0.275, 0.698)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d12fa4a18ad9e40d.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the room and see two points marked on the floor. The first point is at coordinate point(0.349, 0.920) and the second is at point(0.729, 0.297). Which point is closer to you?" }, { "from": "gpt", "value": "Point(0.349, 0.920) is in front of point(0.729, 0.297), so it is closer to you." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d489634a5ea4b906.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the forest and want to reach the point at coordinates point (0.226, 0.128). How far is this point from you?" }, { "from": "gpt", "value": "The point (0.226, 0.128) is 49.92 feet away from you." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8096b9ea1cf2cbfe.jpg", "conversations": [ { "from": "human", "value": "\nYou are trying to determine if the green matte watering cans at lower center can fit under the matte blue bench at center. Based on their heights, can they be placed there without exceeding the bench height?" }, { "from": "gpt", "value": "The green matte watering cans at lower center are shorter than the matte blue bench at center, so they can fit under the bench without exceeding its height." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c6860cdd5f0ea11b.jpg", "conversations": [ { "from": "human", "value": "\nLocate all red woolen coat at left in the image." }, { "from": "gpt", "value": "[(0.074, 0.591)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b358548c7472790.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and want to take a photo of the point at coordinates (0.940, 0.261). The camera has a minimum focusing distance of 4 meters. Will the camera be able to focus on the point?" }, { "from": "gpt", "value": "The point at coordinates (0.940, 0.261) is 3.87 meters from the camera, which is less than the minimum focusing distance of 4 meters. Therefore, the camera will not be able to focus on the point." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34ccdb521ad65f96.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if yellow matte minion at upper right is positioned to the right of matte yellow fondant minion at center?" }, { "from": "gpt", "value": "Correct, you'll find yellow matte minion at upper right to the right of matte yellow fondant minion at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/771430449cdce0dd.jpg", "conversations": [ { "from": "human", "value": "\nWhat is at (0.722, 0.673)?" }, { "from": "gpt", "value": "white printed t-shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/64b0848543fa34ae.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up a shot of the glittery sequined ballet skirt at center. If your camera can focus on objects within 30 inches, will you need to adjust your position?" }, { "from": "gpt", "value": "The glittery sequined ballet skirt at center is 33.74 inches away from the camera, which is beyond the 30 inches focus range. You need to move closer to ensure proper focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d22882dadca8b46.jpg", "conversations": [ { "from": "human", "value": "\nDoes white enamel mug at center have a greater width compared to matte white hand at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f7fbbcadf092a50.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.065, 0.981) lie in front of point (0.781, 0.897)?" }, { "from": "gpt", "value": "Yes, point (0.065, 0.981) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/602890e175101ce9.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between point (0.989, 0.881) and camera?" }, { "from": "gpt", "value": "18.54 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f65943dd235a1f5e.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.588, 0.625) or point (0.910, 0.086)?" }, { "from": "gpt", "value": "Point (0.910, 0.086)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b03473fbdf36d5b8.jpg", "conversations": [ { "from": "human", "value": "\nYou are a delivery driver who needs to park your vehicle in the black asphalt parking lot at center. However, you notice bare branches at upper right nearby. Which direction should you drive to reach the parking lot without passing through the area with the branches?" }, { "from": "gpt", "value": "The black asphalt parking lot at center is positioned on the left side of the bare branches at upper right, so you should drive to the left to reach the parking lot without passing through the area with the branches." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46480e04336d0011.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing 1 meter away from the decorative glass bowl. If you move forward 0.2 meters, will the point at coordinates point (0.246, 0.498) become closer to you?" }, { "from": "gpt", "value": "The distance of point (0.246, 0.498) from viewer is 1.19 meters. Moving forward 0.2 meters from your current position 1 meter away would bring you to 1.2 meters away from the bowl. Since 1.2 meters is farther than 1.19 meters, the point would actually be farther away from you." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8ed119a5cbbf7cb2.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass at center to the right of bronze statue at center from the viewer's perspective?" }, { "from": "gpt", "value": "Correct, you'll find green grass at center to the right of bronze statue at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b09e3c719065bd0a.jpg", "conversations": [ { "from": "human", "value": "\nYou are a rock climber assessing the gear setup on the cliff. You notice the shiny black climbing shoes at center and the red synthetic rope at center. Which object appears taller from your vantage point?" }, { "from": "gpt", "value": "The shiny black climbing shoes at center appears taller than the red synthetic rope at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/74e9496f82c2dbbb.jpg", "conversations": [ { "from": "human", "value": "\nIs matte white arm at upper center in front of white matte hand at upper center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4e284a9b79baca0.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.695, 0.537) and point (0.409, 0.397), which one is positioned behind?" }, { "from": "gpt", "value": "Positioned behind is point (0.409, 0.397)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c18ae13bd1ad461a.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the white leather suitcase at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.396, 0.667)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4584be24afcf4c08.jpg", "conversations": [ { "from": "human", "value": "\nDoes white textured couch at lower right have a lesser height compared to denim jeans at center?" }, { "from": "gpt", "value": "Indeed, white textured couch at lower right has a lesser height compared to denim jeans at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b152c8b1734b7cd1.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of multicolored plastic carousel at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.394, 0.334)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8f215244486ffdd2.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, trash bags at lower center or rubberized asphalt curb at lower left?" }, { "from": "gpt", "value": "Positioned lower is trash bags at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8298d2e861df2949.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the white matte shirt at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.192, 0.614)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9925983ae98fdd5c.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the construction site of the traditional wooden house. There are two points marked on the bamboo roof structure. The first point is at coordinates point (0.749, 0.784) and the second point is at point (0.689, 0.580). Which of these two points is closer to your current position as the observer?" }, { "from": "gpt", "value": "Point (0.749, 0.784) is closer to the camera than point (0.689, 0.580), so the first point is closer to your current position as the observer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8af27b376d007795.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte shirt at center below matte red beanie at center?" }, { "from": "gpt", "value": "Incorrect, black matte shirt at center is not positioned below matte red beanie at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d96a696e499aac15.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if transparent glass skulls at center is positioned to the right of brown textured skull at center?" }, { "from": "gpt", "value": "Incorrect, transparent glass skulls at center is not on the right side of brown textured skull at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88370a54247cb454.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at upper left is shorter than gold polished clock at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/62de7f043613d75b.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the metallic wristwatch at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.456, 0.336)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2effd191ec869a08.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, matte red sweater at center or smooth red pepper at center?" }, { "from": "gpt", "value": "smooth red pepper at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dfdc917186c936aa.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.457, 0.636) from camera?" }, { "from": "gpt", "value": "The distance of point (0.457, 0.636) from camera is 3.10 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c986f22511606ec9.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green grass at upper center is wider than matte black jersey at right?" }, { "from": "gpt", "value": "Correct, the width of green grass at upper center exceeds that of matte black jersey at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cbbcb7ca588f05ca.jpg", "conversations": [ { "from": "human", "value": "\nLocate the green leafy plant at lower right in the image." }, { "from": "gpt", "value": "[(0.902, 0.613)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/56b1c53ddceb387d.jpg", "conversations": [ { "from": "human", "value": "\nIs dirt road at center positioned behind matte dark brown jacket at center?" }, { "from": "gpt", "value": "No, dirt road at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/643814d53d4563fb.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between point (0.267, 0.628) and camera." }, { "from": "gpt", "value": "They are 20.36 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6128a352127123ce.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of white blinds at left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.066, 0.272)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/33ee1ce287bda622.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and want to walk towards the green grass at center. How far do you need to walk?" }, { "from": "gpt", "value": "The green grass at center is 10.67 feet away from the camera, so you need to walk 10.67 feet to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/56d94e5f99e91166.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy hedge at right appear on the left side of gold metallic champagne bottle at center?" }, { "from": "gpt", "value": "Incorrect, green leafy hedge at right is not on the left side of gold metallic champagne bottle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d53e104878f48ba2.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker planning to cross the river. You see the rocky cliff at left and the green matte tree at upper left. Which object would provide a better vantage point to observe the riverbed below?" }, { "from": "gpt", "value": "The rocky cliff at left has a larger size compared to the green matte tree at upper left, so it would provide a better vantage point to observe the riverbed below." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1501a60f55080c6f.jpg", "conversations": [ { "from": "human", "value": "\nBetween spotted fur cheetah at center and red matte shirt at center, which one has more height?" }, { "from": "gpt", "value": "red matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f12304e11cc30420.jpg", "conversations": [ { "from": "human", "value": "\nHow close is white fluffy cloud at upper center from camera?" }, { "from": "gpt", "value": "white fluffy cloud at upper center and camera are 614.99 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/57053202caf35166.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte brown jacket at lower right have a larger size compared to silver metallic microphone at center?" }, { "from": "gpt", "value": "Indeed, matte brown jacket at lower right has a larger size compared to silver metallic microphone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6825bb2282371971.jpg", "conversations": [ { "from": "human", "value": "\nHow much distance is there between blue glossy water at center and blue matte ferry boat at center?" }, { "from": "gpt", "value": "65.33 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/acee7fc779cf2a1f.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of silver metallic pole at left. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.141, 0.470)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2788b6382cc3b8b0.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any brown leather strap at center in the image." }, { "from": "gpt", "value": "[(0.665, 0.700)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/362ae272835fd794.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing the office and need to stack items. Which item, the brown cardboard box at center or the checkered fabric at upper left, can be placed on top of a shelf that requires items to be no thicker than 10 cm?" }, { "from": "gpt", "value": "The brown cardboard box at center is thinner than the checkered fabric at upper left, so the brown cardboard box at center can be placed on the shelf since it meets the thickness requirement." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16b17d11777a5a86.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, gray fabric shirt at upper center or matte black hair at upper left?" }, { "from": "gpt", "value": "gray fabric shirt at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/358ee18d43f92716.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.679, 0.491) come farther from viewer compared to point (0.367, 0.711)?" }, { "from": "gpt", "value": "Yes, it is behind point (0.367, 0.711)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d906950d729d44b2.jpg", "conversations": [ { "from": "human", "value": "\nIs camouflage uniform at center below metallic gray drill at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e70afed51c81bbdd.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.657, 0.734) in front of point (0.565, 0.838)?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6858f605f963a0ca.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of smooth bark tree at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.904, 0.361)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ed5a75697e13d74.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.816, 0.872)?" }, { "from": "gpt", "value": "black stone statue at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5576b6d58e490df4.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the gold matte cape at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.865, 0.572)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/177657acae2da8a3.jpg", "conversations": [ { "from": "human", "value": "\nIs matte red cardigan at left shorter than gray knit sweater at center?" }, { "from": "gpt", "value": "Incorrect, matte red cardigan at left's height does not fall short of gray knit sweater at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dfeeb048d8997c84.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of white matte shirt at upper left from camera?" }, { "from": "gpt", "value": "white matte shirt at upper left and camera are 18.55 inches apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/781b7a14539f731d.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of clear plastic glass at center in the image." }, { "from": "gpt", "value": "[(0.631, 0.880)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7004e6d5fafe84b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black matte blazer at right is thinner than white cotton t-shirt at center?" }, { "from": "gpt", "value": "Indeed, black matte blazer at right has a lesser width compared to white cotton t-shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f818743329190c0.jpg", "conversations": [ { "from": "human", "value": "\nIs transparent blue water at center to the right of clear glass pool at center from the viewer's perspective?" }, { "from": "gpt", "value": "Indeed, transparent blue water at center is positioned on the right side of clear glass pool at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b87a688f9fe4609.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of matte red polo shirt at center in the image." }, { "from": "gpt", "value": "[(0.304, 0.642)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bfd6aedae0c454c6.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, yellow metallic excavator at center or brown dirt at center?" }, { "from": "gpt", "value": "brown dirt at center is more to the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c6eb7399f097399.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth concrete river at lower center positioned at the back of brown brick building at center?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8fcd90d55276250.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, metallic silver fence at center or yellow painted sign at center?" }, { "from": "gpt", "value": "yellow painted sign at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03b1f7f31ae028df.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of yellow matte kayak at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.125, 0.237)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ac4c4d1e16f60b77.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from smooth white shirt at center to camera." }, { "from": "gpt", "value": "smooth white shirt at center is 9.98 feet from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f2c41b85004820dc.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of orange matte frisbee at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.660, 0.409)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/74684e9e58992ea6.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.356, 0.573) from camera?" }, { "from": "gpt", "value": "They are 547.18 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d3b34baf2f1202aa.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.340, 0.412) lie behind point (0.171, 0.866)?" }, { "from": "gpt", "value": "Yes, point (0.340, 0.412) is behind point (0.171, 0.866)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4af480f524046d49.jpg", "conversations": [ { "from": "human", "value": "\nBased on the scene description, where is the metallic silver monitor at right located in the image?" }, { "from": "gpt", "value": "The metallic silver monitor at right is located at point (0.914, 0.377)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e57070137cf2417.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of matte white sign at left in the image." }, { "from": "gpt", "value": "[(0.059, 0.291)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/687da224e9564ff1.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.815, 0.773) or point (0.217, 0.570)?" }, { "from": "gpt", "value": "Point (0.217, 0.570) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/181ab744c1990ce1.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.220, 0.212) positioned in front of point (0.566, 0.650)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dbb37e7fda272a9d.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark blue suit at center appear on the right side of purple suede scarf at left?" }, { "from": "gpt", "value": "Indeed, dark blue suit at center is positioned on the right side of purple suede scarf at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04bbef767c00ce7c.jpg", "conversations": [ { "from": "human", "value": "\nDoes green rubber wave at center have a lesser height compared to white smooth surfboard at center?" }, { "from": "gpt", "value": "In fact, green rubber wave at center may be taller than white smooth surfboard at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f50b8e7181b64d71.jpg", "conversations": [ { "from": "human", "value": "\nBased on the coordinates provided, which object corresponds to the point at (0.233, 0.658)?" }, { "from": "gpt", "value": "The point at (0.233, 0.658) corresponds to the matte purple jersey at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4e17eb4415c9f148.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a white stone castle at center. Pinpoint a point to the white stone castle at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.536, 0.647)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/14ac88a4e6a61e4a.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of green grass at upper left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.077, 0.305)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c73aafc4ba49a57.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the blue water at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.717, 0.486)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d96e9cda245e292.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point labeled point (0.244, 0.416) and want to take a photo of the stage. The camera you are using has a focal length of 50mm and a sensor size of 24mm x 36mm. What is the minimum distance you need to move forward or backward to ensure the entire stage fits within your camera frame?" }, { "from": "gpt", "value": "The point labeled point (0.244, 0.416) is 5.65 meters away from the camera. To ensure the entire stage fits within the camera frame, you need to move to a distance where the field of view covers the stage. However, without knowing the stage dimensions, it is impossible to determine the exact required distance. Please provide the stage dimensions for an accurate calculation." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3f10eb1c475dc33c.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing 1.5 meters away from the camera. You want to take a photo of the black matte shirt at left. Can you reach the camera to adjust it without moving your position?" }, { "from": "gpt", "value": "The distance between you and the camera is 1.5 meters, and the camera and the black matte shirt at left are 1.24 meters apart. Since 1.5 meters is greater than 1.24 meters, you can reach the camera to adjust it without moving." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/94bd5cad01e7fe5c.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.299, 0.245)?" }, { "from": "gpt", "value": "green rough bark tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c4d7cb7f01014c6.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark blue jacket at lower center appear over light brown fabric jacket at lower left?" }, { "from": "gpt", "value": "Incorrect, dark blue jacket at lower center is not positioned above light brown fabric jacket at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/75d8a7672ea7596a.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the white marble statue at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.197, 0.311)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d2029061a51edf47.jpg", "conversations": [ { "from": "human", "value": "\nIs green grassy hill at lower center in front of matte green helicopter at center?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4c86446d19501a4.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.009, 0.825) behind point (0.463, 0.008)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9e0d9bc53732d6d2.jpg", "conversations": [ { "from": "human", "value": "\nHow far is matte gray blazer at center from camera?" }, { "from": "gpt", "value": "matte gray blazer at center is 4.72 feet from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6398b98110261881.jpg", "conversations": [ { "from": "human", "value": "\nYou are a dog owner who wants to ensure both pets have enough space on the couch. Given the presence of the red checkered blanket at upper left and the curly golden fur dog at center, which object takes up more vertical space?" }, { "from": "gpt", "value": "The red checkered blanket at upper left takes up more vertical space since the curly golden fur dog at center is not as tall as it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6cd6695a2cfa63b8.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.694, 0.520) or (0.184, 0.736)?" }, { "from": "gpt", "value": "Point (0.184, 0.736)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b2f67cf35ee41c7.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of matte blue suit at center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.527, 0.606)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e3b8ea03a572e51a.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the dark gray rock at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.081, 0.595)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/247e543ce9501b04.jpg", "conversations": [ { "from": "human", "value": "\nYou are an artist sketching the scene. You notice the green leafy tree at left and the metallic wire at upper right. Which object should you draw first if you want to follow the rule of drawing smaller objects before larger ones?" }, { "from": "gpt", "value": "The green leafy tree at left should be drawn first because it is smaller than the metallic wire at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cb4a86139be68238.jpg", "conversations": [ { "from": "human", "value": "\nIs brown wool sweater at center positioned at the back of gray matte hair at upper left?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0944094ba1fbb352.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue glossy m&m at center appear on the left side of matte red m&m at upper left?" }, { "from": "gpt", "value": "Incorrect, blue glossy m&m at center is not on the left side of matte red m&m at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/036228da49face6b.jpg", "conversations": [ { "from": "human", "value": "\nYou are using a laptop and want to click on one of the two points displayed on the screen. The first point is at coordinate point (0.712, 0.419) and the second is at coordinate point (0.941, 0.833). Since both points are on the screen, which one do you think is closer to the bottom edge of the laptop screen?" }, { "from": "gpt", "value": "Point (0.941, 0.833) is closer to the bottom edge of the laptop screen because its y coordinate is higher than point (0.712, 0.419)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7eab388ff5d6f2c0.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark gray sweater at left have a larger size compared to dark blue leather jacket at right?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/18b68601c9dc81db.jpg", "conversations": [ { "from": "human", "value": "\nBetween glossy black refrigerator at left and brushed metal pendant light at upper center, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "brushed metal pendant light at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b83c159ca0c32126.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing on the side of the road and see the point marked at coordinates (0.154, 0.680). If you want to reach that point, how far do you have to walk?" }, { "from": "gpt", "value": "The point at coordinates (0.154, 0.680) is 11.88 meters away from the viewer, so you would need to walk 11.88 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c290dc9e64c074c.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position and want to reach the point marked at coordinates point (0.197, 0.938). How far do you need to walk to get there?" }, { "from": "gpt", "value": "The point marked at coordinates point (0.197, 0.938) is 4.90 meters away from the camera, so you need to walk 4.90 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4343c3cc875cd52d.jpg", "conversations": [ { "from": "human", "value": "\nIs red matte umbrella at center above matte black umbrella at center?" }, { "from": "gpt", "value": "Incorrect, red matte umbrella at center is not positioned above matte black umbrella at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44c3487ee487f681.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of green cotton hoodie at center more distant than that of white powder at center?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d61fcf2b2c540f31.jpg", "conversations": [ { "from": "human", "value": "\nBetween clear water at lower right and cloudy sky at upper center, which one is positioned higher?" }, { "from": "gpt", "value": "cloudy sky at upper center is above." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed3a15a14c4681f2.jpg", "conversations": [ { "from": "human", "value": "\nIs snow-covered bush at lower left to the right of green textured pine tree at upper center from the viewer's perspective?" }, { "from": "gpt", "value": "No, snow-covered bush at lower left is not to the right of green textured pine tree at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/319fffefb482b410.jpg", "conversations": [ { "from": "human", "value": "\nYou are a wildlife photographer standing on a platform. You want to capture a closeup shot of the black glossy penguin at center. Given that your camera has a minimum focusing distance of 2 meters, will you be able to take the photo without moving closer?" }, { "from": "gpt", "value": "The distance between you and the black glossy penguin at center is 2.69 meters, which is greater than the camera minimum focusing distance of 2 meters. Therefore, you can take the photo without moving closer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f323d135562247b8.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue fabric shirt at right have a greater width compared to matte black glasses at upper center?" }, { "from": "gpt", "value": "Yes, blue fabric shirt at right is wider than matte black glasses at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/33320e4a66691476.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.538, 0.641)?" }, { "from": "gpt", "value": "maroon satin shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/45c3bbc9452b6277.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if pink satin dress at center is thinner than green matte eye at center?" }, { "from": "gpt", "value": "In fact, pink satin dress at center might be wider than green matte eye at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/84ccc2d0ec2e1190.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of point (0.058, 0.752)?" }, { "from": "gpt", "value": "7.85 feet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf9f9c45ee1d21d8.jpg", "conversations": [ { "from": "human", "value": "\nDoes black plastic microphone at left appear over black plastic microphone at right?" }, { "from": "gpt", "value": "Actually, black plastic microphone at left is below black plastic microphone at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d92b463de67ca19.jpg", "conversations": [ { "from": "human", "value": "\nDoes white cloth at left lie in front of hardcover book at center?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/21e33762110bbc22.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the Shengxing Railway Station and want to take a photo of the point at coordinates (0.320, 0.780). If your camera has a focal length of 50mm and you are 5.85 meters away from the point, will the point be in focus if your depth of field is set to 6 meters?" }, { "from": "gpt", "value": "The point at coordinates (0.320, 0.780) is exactly 5.85 meters from the camera, and the depth of field is set to 6 meters. Since the distance is within the depth of field range, the point will be in focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb4f2ef22c9946a7.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the room and want to place a 4.5 feet long laptop charger on the wooden table at center. Can you fit the charger on the table without it hanging over the edge?" }, { "from": "gpt", "value": "The wooden table at center is 4.29 feet from viewer. The distance from the viewer does not indicate the table size. Therefore, it is unclear if the 4.5 feet long charger can fit without hanging over the edge based on the provided information." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/43ff64757011b1f7.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the purple fabric shirt at lower left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.319, 0.755)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b161358ab1d2b42.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of white and brown speckled horse at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.358, 0.452)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29613d3a02fa2862.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of velvet skirt at center?" }, { "from": "gpt", "value": "velvet skirt at center and camera are 1.31 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a6ab2287ef9abb93.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the conference room and see the point marked at coordinates (0.333, 0.647). What object is located at that point?" }, { "from": "gpt", "value": "The point at coordinates (0.333, 0.647) indicates the orange fabric jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/da4f49e870d15cf4.jpg", "conversations": [ { "from": "human", "value": "\nYou are a teacher observing the classroom scene. You notice the green fabric shirt at center and the white plastic table at upper center. Which object takes up more horizontal space in the image?" }, { "from": "gpt", "value": "The white plastic table at upper center takes up more horizontal space than the green fabric shirt at center because the green fabric shirt at center has a lesser width compared to white plastic table at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f2437b0fcfdf3946.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.988, 0.355) closer to viewer compared to point (0.881, 0.567)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.881, 0.567)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d52b4010aa39f57.jpg", "conversations": [ { "from": "human", "value": "\nYou are attending a conference and need to identify which attendee is taller between the black matte shirt at center and the striped cotton shirt at center. Based on the scene, which one is taller?" }, { "from": "gpt", "value": "The black matte shirt at center is taller than the striped cotton shirt at center according to the description." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/30048ab8f56698f4.jpg", "conversations": [ { "from": "human", "value": "\nLocate the golden fur dog at center in the image." }, { "from": "gpt", "value": "[(0.572, 0.645)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2fed08b6e5e29d77.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.678, 0.655) lie in front of point (0.930, 0.698)?" }, { "from": "gpt", "value": "Yes, point (0.678, 0.655) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01109d639318a4e6.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.690, 0.642) positioned in front of point (0.003, 0.327)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df9db998563afa74.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.479, 0.984) closer to camera compared to point (0.215, 0.775)?" }, { "from": "gpt", "value": "Yes, point (0.479, 0.984) is in front of point (0.215, 0.775)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dec232182148dac0.jpg", "conversations": [ { "from": "human", "value": "\nWhat object lies at (0.562, 0.844)?" }, { "from": "gpt", "value": "white fabric shirt at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/68740c0b2358af93.jpg", "conversations": [ { "from": "human", "value": "\nYou are a visitor at this historic site and want to take a photo of the green leafy tree at upper left without the rusty metal railing at lower left in the frame. Which direction should you move to ensure the tree is visible but the railing is not?" }, { "from": "gpt", "value": "Move to the left side so that the green leafy tree at upper left is framed without the rusty metal railing at lower left, since the railing is positioned to the right of the tree." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fabf4ce8aaf9c798.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of black shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.333, 0.859)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4ee201171ef597ad.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.985, 0.928) and point (0.822, 0.719), which one is positioned behind?" }, { "from": "gpt", "value": "Point (0.822, 0.719)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0c91e0833da172c6.jpg", "conversations": [ { "from": "human", "value": "\nWhich object can be found at (0.801, 0.589)?" }, { "from": "gpt", "value": "white printed blouse at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9481934c8540a2ef.jpg", "conversations": [ { "from": "human", "value": "\nBetween translucent plastic bottle at center and translucent glass at table center, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "From the viewer's perspective, translucent glass at table center appears more on the left side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ceb87b0ca9edc126.jpg", "conversations": [ { "from": "human", "value": "\nIdentify a spot on the black glass street light at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.828, 0.447)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/094ce25e23c706b5.jpg", "conversations": [ { "from": "human", "value": "\nYou are organizing a photo shoot and need to ensure that all clothing items in the scene are visible. Given that the denim jeans at center and the matte gray sweater at left are part of the outfits, which clothing item might be partially obscured if the camera angle is too low?" }, { "from": "gpt", "value": "The denim jeans at center is taller than the matte gray sweater at left, so if the camera angle is too low, the denim jeans at center might partially obscure the matte gray sweater at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1be2f09cffabfa01.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the dirt path in the village and want to reach the rustic wooden hut at right. How far do you need to walk to get there?" }, { "from": "gpt", "value": "The rustic wooden hut at right is 5.00 meters away from you, so you need to walk 5.00 meters to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4fa9e48da3753c68.jpg", "conversations": [ { "from": "human", "value": "\nLocate the green jersey at center in the image." }, { "from": "gpt", "value": "[(0.309, 0.492)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d76c741f00fd2c46.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the camera position. You want to take a photo of the couple but need to adjust your position to ensure the point at coordinate point (0.542, 0.347) is in focus. How far should you move forward or backward to achieve this?" }, { "from": "gpt", "value": "The point at coordinate point (0.542, 0.347) is 41.97 meters away from the camera. To focus on this point, you should position yourself so that the camera is exactly 41.97 meters away from the point." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ccab14f5da2827b4.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.400, 0.809) positioned before point (0.311, 0.503)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.311, 0.503)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/675bee37fcd70f1e.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at upper center appear on the left side of brown fur antelope at center?" }, { "from": "gpt", "value": "Yes, green leafy tree at upper center is to the left of brown fur antelope at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eda462e5722638f3.jpg", "conversations": [ { "from": "human", "value": "\nLocate the green stone water at center in the image." }, { "from": "gpt", "value": "[(0.801, 0.597)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/088bdd1705067783.jpg", "conversations": [ { "from": "human", "value": "\nYou are planning to install a new decorative element on the house. You have two options to choose from. One is a narrow decorative element that can fit in spaces up to 1 meter wide, and the other is a wider decorative element that requires at least 1.5 meters of space. Based on the image, which decorative element should you choose for the black wrought iron railing at lower left and which for the pink wood shutter at upper left?" }, { "from": "gpt", "value": "The black wrought iron railing at lower left is wider than the pink wood shutter at upper left. Therefore, the wider decorative element should be placed on the black wrought iron railing at lower left, and the narrow decorative element should be placed on the pink wood shutter at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a01612e7883ebca6.jpg", "conversations": [ { "from": "human", "value": "\nIs white satin business suit at center to the right of translucent plastic cup at lower left from the viewer's perspective?" }, { "from": "gpt", "value": "Correct, you'll find white satin business suit at center to the right of translucent plastic cup at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed82caf028e82d14.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in an office and see two points marked on the wall. The first point is at coordinates point (0.340, 0.098) and the second is at point (0.844, 0.278). Which point is closer to you?" }, { "from": "gpt", "value": "Point (0.340, 0.098) is closer to the viewer than point (0.844, 0.278)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/946d34c4c1a1cb76.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.673, 0.608) or (0.162, 0.827)?" }, { "from": "gpt", "value": "Positioned in front is point (0.673, 0.608)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cbe17b0c1aadec73.jpg", "conversations": [ { "from": "human", "value": "\nYou are a LEGO enthusiast examining the display table. You notice the gray matte tank at lower left and the translucent plastic minifigures at upper right. Which object is larger in size?" }, { "from": "gpt", "value": "The gray matte tank at lower left is smaller than the translucent plastic minifigures at upper right, so the translucent plastic minifigures at upper right are larger." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/347a4c31a55dd6d3.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the black fabric pants at lower center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.328, 0.906)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db026d5c0a6eaef6.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance measurement between wooden boat at center and matte gray coat at center?" }, { "from": "gpt", "value": "wooden boat at center is 3.10 meters away from matte gray coat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82437f5399bb9f81.jpg", "conversations": [ { "from": "human", "value": "\nLocate whiteboard at upper right in the image." }, { "from": "gpt", "value": "[(0.789, 0.375)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/131d33e0988f73c6.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.905, 0.841) closer to camera compared to point (0.460, 0.800)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/466bd4874d9c4991.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is located at (0.222, 0.383)?" }, { "from": "gpt", "value": "white matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eac8c7fcbf2351d3.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of the forest and see the point marked at coordinates (0.531, 0.142). Based on the scene description, what object or feature is located at this point?" }, { "from": "gpt", "value": "The point at coordinates (0.531, 0.142) corresponds to a white foggy cloud at upper center in the scene." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a523bf7839695bc4.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to focus on the smooth skin face at upper right and the teethwhitetooth at center in the image. Which of these two objects is closer to the camera?" }, { "from": "gpt", "value": "The smooth skin face at upper right is closer to the viewer than teethwhitetooth at center, so the smooth skin face at upper right is closer to the camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/688c84522734cd05.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up for a group photo. You notice the black matte tank top at left and the blonde synthetic wig at upper right. Which object is located to the left of the other?" }, { "from": "gpt", "value": "The black matte tank top at left is positioned on the left side of blonde synthetic wig at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4649ca379965987d.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of white fluffy snow at lower center from green matte evergreen tree at lower left?" }, { "from": "gpt", "value": "A distance of 5.01 meters exists between white fluffy snow at lower center and green matte evergreen tree at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c83f2263b335743.jpg", "conversations": [ { "from": "human", "value": "\nCould you provide the distance between velvet couch at center and wooden table at center?" }, { "from": "gpt", "value": "velvet couch at center is 3.88 feet away from wooden table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff0ba0e499cf02e8.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of white matte sign at upper right in the image." }, { "from": "gpt", "value": "[(0.707, 0.497)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bfec0f393e026db7.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of the church and want to take a photo of the altar area. There is a point at coordinates point (0.834, 0.780) that you need to focus on. What is the distance from your current position to that point?" }, { "from": "gpt", "value": "The distance from your current position to point (0.834, 0.780) is 185.14 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/add175c7696b69e2.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.367, 0.898) or (0.631, 0.920)?" }, { "from": "gpt", "value": "Point (0.631, 0.920)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb6a3e5c0b9b568b.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked by coordinates point (0.132, 0.295) in the orchard. Which direction should you walk to reach the green leafy tree at left?" }, { "from": "gpt", "value": "The point (0.132, 0.295) is the location of the green leafy tree at left, so you are already at the tree." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/baee443b92ef9d9f.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, blue smooth water at center or smooth gray dolphin at lower right?" }, { "from": "gpt", "value": "blue smooth water at center is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60bd4f6ea4df32bf.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a portrait of the striped wool scarf at center and the matte skin hand at center. Based on their positions, which object is closer to the camera?" }, { "from": "gpt", "value": "The striped wool scarf at center is closer to the camera because the matte skin hand at center is behind it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3642f093deb8228b.jpg", "conversations": [ { "from": "human", "value": "\nHow far is matte purple eyeshadow at center from camera?" }, { "from": "gpt", "value": "They are 15.65 inches apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5febf64dc56887d6.jpg", "conversations": [ { "from": "human", "value": "\nYou are a bird soaring in the sky and want to land on the water. Given that your wingspan is 1.5 meters, can you safely glide between the cloudy sky at center and the green translucent water at center without hitting any obstacles?" }, { "from": "gpt", "value": "The distance between the cloudy sky at center and the green translucent water at center is 190.74 meters, which is significantly larger than your wingspan of 1.5 meters. Therefore, you can safely glide between them without any issues." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aee4dce070f18ef6.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the blue t-shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.614, 0.589)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e776c1f88e2f2bca.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, yellow smooth pineapple at upper right or orange glossy physalis at lower right?" }, { "from": "gpt", "value": "orange glossy physalis at lower right is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34d6cd2b12938a9d.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of grass at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.522, 0.831)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/27ed302596ad51cd.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to choose between two phones in the image to take a clearer photo. The satin black phone at upper center and the matte black phone at upper center are both options. Which phone is taller and might have a larger screen for better framing?" }, { "from": "gpt", "value": "The satin black phone at upper center is taller than the matte black phone at upper center, so it might have a larger screen for better framing." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2004bd2605dc6fb6.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position observing the beach scene. There is a point at coordinates point (0.181, 0.864). How far is that point from you?" }, { "from": "gpt", "value": "The distance of point (0.181, 0.864) from camera is 7.23 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cff5a2458e5abc0b.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position in the museum. There is a point marked at coordinates (0.765, 0.327) in the image. How far is that point from your current position?" }, { "from": "gpt", "value": "The point at (0.765, 0.327) is 5.97 meters away from the camera position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82cb946527d3e569.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at center smaller than light gray stone tower at center?" }, { "from": "gpt", "value": "Incorrect, green leafy tree at center is not smaller in size than light gray stone tower at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c95d13b5bb1b893d.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of black plastic video camera at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.285, 0.397)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a0775a5e54ed1918.jpg", "conversations": [ { "from": "human", "value": "\nDoes green grass at center have a smaller size compared to white cotton kurta at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a084c83d3c29d3f8.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black satin dress at center is bigger than black matte tank top at center?" }, { "from": "gpt", "value": "No, black satin dress at center is not bigger than black matte tank top at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca77784066265601.jpg", "conversations": [ { "from": "human", "value": "\nIs metallic pole at right bigger than metallic pole at lower center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/acda539655f664c5.jpg", "conversations": [ { "from": "human", "value": "\nDoes white fabric canopy at upper center appear on the right side of blonde hair at center?" }, { "from": "gpt", "value": "Incorrect, white fabric canopy at upper center is not on the right side of blonde hair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/812693f77c99a5c0.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.453, 0.736) or point (0.241, 0.433)?" }, { "from": "gpt", "value": "Point (0.453, 0.736)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba3cfe6dac755536.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.625, 0.381) positioned behind point (0.230, 0.398)?" }, { "from": "gpt", "value": "No, (0.625, 0.381) is closer to viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16822d0159e68759.jpg", "conversations": [ { "from": "human", "value": "\nIs striped cotton shirt at left further to the viewer compared to black matte shirt at center?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9021d175b05aeacb.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.581, 0.709) positioned behind point (0.807, 0.339)?" }, { "from": "gpt", "value": "Yes, it is behind point (0.807, 0.339)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c9f25dd953baa097.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, green grass at center or light blue cotton shirt at center?" }, { "from": "gpt", "value": "Positioned lower is green grass at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a913212f48934de5.jpg", "conversations": [ { "from": "human", "value": "\nWhere is white plastic chair at lower center located? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above." }, { "from": "gpt", "value": "[(0.656, 0.947)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1cb116a95b320a34.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer setting up for a panel discussion. You need to ensure that the wooden table at center and the black matte shirt at center are both visible in your shot. Given that your camera has a minimum focus distance of 30 inches, will you be able to capture both objects clearly without moving the camera closer?" }, { "from": "gpt", "value": "The wooden table at center is 30.82 inches from the black matte shirt at center. Since the distance between them is slightly over 30 inches, the camera can focus on both objects as the distance meets the minimum focus requirement." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/551f22672ee439ac.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown stone villa at center is bigger than white plastic lounge chair at lower right?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4c3ce2a59e05c56f.jpg", "conversations": [ { "from": "human", "value": "\nIs gray stone temple at center smaller than green leafy tree at center?" }, { "from": "gpt", "value": "Incorrect, gray stone temple at center is not smaller in size than green leafy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/438609e1ecf5ebc8.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer standing at the starting point of the dirt path. You want to take a photo of the black glossy horse at center from a distance of 10 meters. Based on the scene description, can you position yourself correctly to achieve this?" }, { "from": "gpt", "value": "The black glossy horse at center is 10.30 meters away from the camera. To take a photo from exactly 10 meters away, you need to move slightly closer by 0.30 meters to reduce the distance to the desired 10 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/edbe28c5c1736930.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of shiny dark rock at upper center? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.712, 0.105)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00439b1e36c54082.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if yellow cotton shirt at left is wider than floral-patterned fabric dress at center?" }, { "from": "gpt", "value": "No, yellow cotton shirt at left is not wider than floral-patterned fabric dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be2a36754b80a638.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of blue plaid shorts at right. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.938, 0.239)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b142ce13bd2bb44f.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of matte blue dress at center in the image." }, { "from": "gpt", "value": "[(0.627, 0.592)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/224f444568805f25.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue water at upper center is positioned to the right of green leafy palm tree at center?" }, { "from": "gpt", "value": "In fact, blue water at upper center is to the left of green leafy palm tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/022d79f2a35238fc.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the room where the photo was taken. The black glossy tv at center is showing a live feed of this very room. You want to move closer to the TV so that you can see the screen clearly without straining your eyes. What is the minimum distance you should stand from the TV to ensure you can view it comfortably?" }, { "from": "gpt", "value": "To view the black glossy tv at center comfortably, you should stand at least 9.75 feet away from it, as that is the distance between the TV and the camera, which is likely the optimal viewing distance for the live feed setup." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8e4dd89856e48ab.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue tarpaulin boat at lower right have a larger size compared to wooden planks dock at left?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/256f23b2e11b852d.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the white matte van at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.955, 0.500)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2aa74a65da2f0b7a.jpg", "conversations": [ { "from": "human", "value": "\nLocate all gray fabric shirt at lower left in the image." }, { "from": "gpt", "value": "[(0.433, 0.830)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/59b2623e0a5e577d.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, clear glass window at upper left or multicolored woven duffel at lower left?" }, { "from": "gpt", "value": "multicolored woven duffel at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cfe861728aba9608.jpg", "conversations": [ { "from": "human", "value": "\nWhich is below, maroon fabric baseball cap at center-left or matte aluminum helmet at upper center?" }, { "from": "gpt", "value": "maroon fabric baseball cap at center-left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c645a5ba2e3ee1c8.jpg", "conversations": [ { "from": "human", "value": "\nHow close is orange matte beach ball at lower center from orange cotton shorts at lower left?" }, { "from": "gpt", "value": "orange matte beach ball at lower center and orange cotton shorts at lower left are 27.26 inches apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7be8e1cef0b84a9b.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.676, 0.930) and point (0.829, 0.880), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.676, 0.930)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0fe4890737dff0a4.jpg", "conversations": [ { "from": "human", "value": "\nDoes smooth bark tree at center appear under paper cup at lower left?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2a57a493f8a68baf.jpg", "conversations": [ { "from": "human", "value": "\nPoint to all occurrences of white stone column at left in the image." }, { "from": "gpt", "value": "[(0.121, 0.656)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c48b4311feb9fda0.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass field at center to the left of green wooden bleachers at left from the viewer's perspective?" }, { "from": "gpt", "value": "No, green grass field at center is not to the left of green wooden bleachers at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8a1edc7abef411a.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any smooth concrete river at center in the image." }, { "from": "gpt", "value": "[(0.708, 0.861)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/33e99b75c0676059.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, transparent water at lower center or green patina statue at center, stands taller?" }, { "from": "gpt", "value": "green patina statue at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/79a27c73578f8fd7.jpg", "conversations": [ { "from": "human", "value": "\nYou are a city planner analyzing this photograph. You need to determine which of the two objects, the metallic smooth escalator at center or the smooth metal train track at center, occupies a larger area in the image. Based on the scene description, which one is longer?" }, { "from": "gpt", "value": "The smooth metal train track at center is longer than the metallic smooth escalator at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0555a1f17c73207c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if silver metallic video camera at center is positioned above blue matte passport at center-left?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec13e4706bfd1558.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, matte black magazine at lower left or hardcover book at upper left?" }, { "from": "gpt", "value": "matte black magazine at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/76bc745005d77d6e.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the black rubber tire at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.861, 0.491)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/80363fa3d41426dc.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a closeup shot of the black fleece vest at right and the dark gray jacket at center. Since you want both subjects in focus, you need to adjust your camera settings. Which object should you focus on to ensure both are sharp?" }, { "from": "gpt", "value": "You should focus on the black fleece vest at right because it is closer to the viewer than the dark gray jacket at center. By focusing on the closer object, the depth of field will extend further, increasing the likelihood that both will be in focus." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c399bede84f7b7e2.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between black metal railing at center and camera?" }, { "from": "gpt", "value": "A distance of 88.94 feet exists between black metal railing at center and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b2d5703d201ee49.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.827, 0.558) positioned in front of point (0.420, 0.934)?" }, { "from": "gpt", "value": "Yes, point (0.827, 0.558) is in front of point (0.420, 0.934)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b4ef8b036eedcb5.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of dark brown fur cat at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.192, 0.609)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/484383f48e4e46c1.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a group photo of two people wearing maroon striped sweater at center and dark brown sweater at upper center. Since you want to ensure both are clearly visible, which sweater should you focus on to make sure it stands out more in the photo?" }, { "from": "gpt", "value": "The maroon striped sweater at center is bigger than dark brown sweater at upper center, so focusing on the maroon striped sweater at center will ensure it stands out more in the photo." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/743df0eccf5e12f5.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture a clear shot of the black matte tank top at upper center and the dark brown hair at upper left. Since you want to ensure both are visible in the frame, which object should you focus on first to account for their size difference?" }, { "from": "gpt", "value": "The black matte tank top at upper center is bigger than the dark brown hair at upper left, so you should focus on the black matte tank top at upper center first as it occupies more space in the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d98b059d247f3a08.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.605, 0.409) and point (0.593, 0.616), which one is positioned in front?" }, { "from": "gpt", "value": "Positioned in front is point (0.593, 0.616)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd38d148b48e8959.jpg", "conversations": [ { "from": "human", "value": "\nDoes white glossy bowl at center appear on the right side of golden crispy fritters at center?" }, { "from": "gpt", "value": "Incorrect, white glossy bowl at center is not on the right side of golden crispy fritters at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e48be3c30624fd3.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte shirt at center have a greater width compared to blonde hair at lower center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1bada8daa0335f6.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the banquet hall and want to take a photo of the red, vintage wooden box with gold handles. The box is in front of you. There is a point marked at coordinates (0.406, 0.622). How far is that point from you?" }, { "from": "gpt", "value": "The point at (0.406, 0.622) is 1.18 meters away from you." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/90f8473968974ec7.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of white matte jacket at lower left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.292, 0.584)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dfab2123d2f9110e.jpg", "conversations": [ { "from": "human", "value": "\nBetween matte black jacket at left and olive-green leather jacket at center, which one has more height?" }, { "from": "gpt", "value": "With more height is matte black jacket at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e7c6bc7e97b6e81f.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if purple matte jacket at lower right is wider than metallic gray ship at center?" }, { "from": "gpt", "value": "No, purple matte jacket at lower right is not wider than metallic gray ship at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ecad0a00d4dade3.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green matte van at left is positioned below white matte truck at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82a06e5f21d877a5.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of matte red bus at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.530, 0.392)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f21e1343cd6819ed.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to green mossy rock at upper center? Please provide its 2D coordinates.Where can I find green mossy rock at upper center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.545, 0.550)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c780ded872f3c7a.jpg", "conversations": [ { "from": "human", "value": "\nBetween red paper lantern at upper right and red paper lantern at upper left, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "red paper lantern at upper left is more to the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85371408226df92f.jpg", "conversations": [ { "from": "human", "value": "\nIs black fabric baseball cap at upper left to the right of dark glass bottles at center from the viewer's perspective?" }, { "from": "gpt", "value": "Indeed, black fabric baseball cap at upper left is positioned on the right side of dark glass bottles at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/154315e5ec7ccf8b.jpg", "conversations": [ { "from": "human", "value": "\nHow far apart are white glossy car at center and matte silver sedan at center?" }, { "from": "gpt", "value": "A distance of 79.04 feet exists between white glossy car at center and matte silver sedan at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f0b16ee4d4b7ebcb.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of pink fabric at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.314, 0.747)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e6b9d2cacc6fbf06.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the depth value of point (0.095, 0.439)?" }, { "from": "gpt", "value": "Point (0.095, 0.439) and camera are 19.46 feet apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4b358e829db49790.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.538, 0.291) from camera?" }, { "from": "gpt", "value": "Point (0.538, 0.291) and camera are 1194.38 feet apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d3444fc51319a016.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.510, 0.100) behind point (0.921, 0.766)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/10448180076db691.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any transparent blue water at center in the image." }, { "from": "gpt", "value": "[(0.543, 0.445)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b08ab3de6872d15.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from point (0.281, 0.725) to camera." }, { "from": "gpt", "value": "They are 1.16 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/621864bd1eab933d.jpg", "conversations": [ { "from": "human", "value": "\nDoes smooth sand at center appear under purple matte jacket at center?" }, { "from": "gpt", "value": "Incorrect, smooth sand at center is not positioned below purple matte jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e01867bd2ae3cefb.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the lion in the center. You notice a point at coordinates (0.459, 0.458). Is this point located on the lion?" }, { "from": "gpt", "value": "Yes, the point at coordinates (0.459, 0.458) is located on the fuzzy brown lion at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c801d7238cc32a2c.jpg", "conversations": [ { "from": "human", "value": "\nLocate the blue plaid shirt at center in the image." }, { "from": "gpt", "value": "[(0.491, 0.627)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef23bd0f2525d877.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from translucent plastic soap dispenser at lower left to camera." }, { "from": "gpt", "value": "translucent plastic soap dispenser at lower left is 8.09 feet away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0fd8552e5b37146b.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer planning to capture the Empire State Building. You notice the glassy reflective skyscraper at center and the gold metallic spire at center. Which object should you focus on if you want to photograph the larger one?" }, { "from": "gpt", "value": "The glassy reflective skyscraper at center is bigger than the gold metallic spire at center, so you should focus on the glassy reflective skyscraper at center to photograph the larger one." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce4b61faad5d5fe5.jpg", "conversations": [ { "from": "human", "value": "\nWho is positioned more to the right, brown thatch roof at center or green grass at lower center?" }, { "from": "gpt", "value": "green grass at lower center is more to the right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3cdb43c8325505a6.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer trying to capture the smooth concrete pavement at lower right and the white cotton blouse at lower center in a single frame. Given that your camera can only focus on one object at a time, which object should you prioritize focusing on to ensure it appears sharp and clear in the photo?" }, { "from": "gpt", "value": "You should prioritize focusing on the smooth concrete pavement at lower right because it is bigger than the white cotton blouse at lower center, making it more prominent in the frame." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6bcac8e3f8054e97.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.098, 0.397) come in front of point (0.808, 0.736)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7a850bcad97a9639.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of green checkered shirt at center from camera?" }, { "from": "gpt", "value": "1.73 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fa0a5234854e5646.jpg", "conversations": [ { "from": "human", "value": "\nIs satin yellow dress at center further to the viewer compared to black satin cape at right?" }, { "from": "gpt", "value": "No, satin yellow dress at center is in front of black satin cape at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7781620747f74721.jpg", "conversations": [ { "from": "human", "value": "\nBased on the scene description, where is the black and white zigzag dress at center located in terms of coordinates?" }, { "from": "gpt", "value": "The black and white zigzag dress at center is located at coordinates point (0.715, 0.637)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc5c4c33b8af702f.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.931, 0.277) or (0.777, 0.853)?" }, { "from": "gpt", "value": "Point (0.777, 0.853)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02884c22a48376e5.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.327, 0.688) come closer to viewer compared to point (0.334, 0.803)?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f554e4cd7eb359fd.jpg", "conversations": [ { "from": "human", "value": "\nYou are planning to build a small garden near the shelter. Based on the image, which object is closer to you if you are standing at the shelter? The brown rocky mountain at upper center or the brown sandy ground at center?" }, { "from": "gpt", "value": "The brown rocky mountain at upper center is closer to you because the brown sandy ground at center is behind it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d5d7444390a276c.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of neon yellow safety vest at right? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.705, 0.553)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c0d2bbb0318e8f61.jpg", "conversations": [ { "from": "human", "value": "\nHow close is green mossy bark tree trunk at center from green mossy rock at lower right?" }, { "from": "gpt", "value": "6.07 feet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c6d832414cc2dc58.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between point (0.845, 0.761) and camera." }, { "from": "gpt", "value": "Point (0.845, 0.761) and camera are 6.51 feet apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b00ea4c48dda5377.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, smooth white shirt at center or smooth bald head at lower left, stands taller?" }, { "from": "gpt", "value": "Standing taller between the two is smooth white shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8615eb366dda8176.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any translucent glass perfume at center in the image." }, { "from": "gpt", "value": "[(0.358, 0.470)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4503a57cf99f875.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the green leafy hillside at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.471, 0.359)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e640a24031c343f8.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the event and want to capture a photo that includes both the navy blue uniform at center and the maroon beret at left. Based on their positions, which one should you place on the left side of the photo to ensure both are visible?" }, { "from": "gpt", "value": "The maroon beret at left should be placed on the left side of the photo because the navy blue uniform at center is positioned to its right, meaning the maroon beret is already on the left relative to the navy blue uniform." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f5616961436748a.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the base of the monument looking towards the central plaza. There are two points marked on the lawn. Which point is closer to you, point (0.898, 0.873) or point (0.190, 0.744)?" }, { "from": "gpt", "value": "Point (0.898, 0.873) is closer to you than point (0.190, 0.744)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab663876164e9d95.jpg", "conversations": [ { "from": "human", "value": "\nIs dark brown hair at center thinner than light blue shirt at right?" }, { "from": "gpt", "value": "No, dark brown hair at center is not thinner than light blue shirt at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7c8e5d15a83278e7.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.610, 0.330) and point (0.512, 0.487), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.610, 0.330) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b59d4ab679834be3.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the entrance of the modern architectural structure and notice a specific point marked at coordinates point (0.368, 0.817). Based on the scene description, can you determine what material this point is located on?" }, { "from": "gpt", "value": "The point (0.368, 0.817) is located on the matte red barn at center, which is made of vibrant red panels." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8286dc8a48ff57de.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the black matte turtleneck sweater at left. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.266, 0.389)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5fedb1747c5347b.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown gravel dirt track at lower center appear over green leafy tree at left?" }, { "from": "gpt", "value": "Actually, brown gravel dirt track at lower center is below green leafy tree at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba7b8e4e5b92923d.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, brown leather jacket at center or brown woolen jacket at lower left?" }, { "from": "gpt", "value": "brown woolen jacket at lower left is lower down." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e7bab0d4ac1933f.jpg", "conversations": [ { "from": "human", "value": "\nIs plaid fabric shirt at lower left positioned before light brown leather shoes at lower center?" }, { "from": "gpt", "value": "Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/56e2ce9a34e2269f.jpg", "conversations": [ { "from": "human", "value": "\nYou are a customer in the supermarket and want to place both the yellow matte spice at center and the matte black shirt at center into your shopping basket. Which item should you place first to ensure both fit properly?" }, { "from": "gpt", "value": "You should place the matte black shirt at center first because it is larger in size compared to the yellow matte spice at center, allowing the smaller item to fit into any remaining space." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8abd0b6cebd1b60b.jpg", "conversations": [ { "from": "human", "value": "\nIs matte brown guitar at lower left bigger than matte brown guitar at center?" }, { "from": "gpt", "value": "Actually, matte brown guitar at lower left might be smaller than matte brown guitar at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/10c8be17391df9c8.jpg", "conversations": [ { "from": "human", "value": "\nYou are a pedestrian standing on the black metal rail at lower left and want to cross to the other side of the river. Is the metallic gray bridge at center above or below your current position?" }, { "from": "gpt", "value": "The black metal rail at lower left is positioned under the metallic gray bridge at center, so the bridge is above your current position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eff71b4f81d486a0.jpg", "conversations": [ { "from": "human", "value": "\nDoes black rubber penguin at center have a greater height compared to white matte penguin at right?" }, { "from": "gpt", "value": "In fact, black rubber penguin at center may be shorter than white matte penguin at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e6fc758fefc1814.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of blue fabric uniform at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.543, 0.555)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/194ef0e4d35e664f.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.795, 0.795) come closer to viewer compared to point (0.513, 0.261)?" }, { "from": "gpt", "value": "That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd9095717f35455c.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of white smooth stupa at left? Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.230, 0.736)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/99a0afb1df7e226d.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is smooth brown water at center from brown rough wood log at lower center?" }, { "from": "gpt", "value": "smooth brown water at center and brown rough wood log at lower center are 12.94 meters apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86950c7cb7af0ad9.jpg", "conversations": [ { "from": "human", "value": "\nBetween clear glass window at center and matte white window at upper left, which one appears on the right side from the viewer's perspective?" }, { "from": "gpt", "value": "From the viewer's perspective, clear glass window at center appears more on the right side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06f1f08d99abf348.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the lakeside and want to take a photo of both the blue wooden hut at center and the yellow leafy tree at upper center. If your camera can capture objects up to 50 feet away, will both be in focus?" }, { "from": "gpt", "value": "The blue wooden hut at center is 47.74 feet away from the yellow leafy tree at upper center. Since the camera can capture up to 50 feet, both objects will be in focus as the distance between them is within the camera range." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df207e7ad297ef97.jpg", "conversations": [ { "from": "human", "value": "\nCan you provide the distance between point (0.324, 0.822) and camera?" }, { "from": "gpt", "value": "The distance of point (0.324, 0.822) from camera is 3.70 meters." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7494cbb38ddf6684.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of matte wood shed at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.553, 0.780)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a0f9a953a8b810a.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue striped umbrella at center have a lesser width compared to green fabric beach chair at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/623765d69558495d.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.428, 0.747) and camera." }, { "from": "gpt", "value": "Point (0.428, 0.747) is 6.70 inches from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/386dd67d735a3d0a.jpg", "conversations": [ { "from": "human", "value": "\nYou are a hiker who has just started your journey in the desert. You see the desert soil at center and the rustic rock formation at center. How far apart are these two landmarks?" }, { "from": "gpt", "value": "The distance between the desert soil at center and the rustic rock formation at center is 619.95 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/87c00c42a17c2433.jpg", "conversations": [ { "from": "human", "value": "\nYou are an engineer inspecting the water treatment facility. You notice the metallic water at center and the metallic silver platform at center. Which one has a larger surface area?" }, { "from": "gpt", "value": "The metallic water at center has a larger surface area than the metallic silver platform at center because it is bigger." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0fcf295b445ceaa.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if yellow matte truck at center is positioned to the right of dark blue uniform at center?" }, { "from": "gpt", "value": "Yes, yellow matte truck at center is to the right of dark blue uniform at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e2cf64084100f759.jpg", "conversations": [ { "from": "human", "value": "\nPoint to metallic steel bridge at center.Point to the metallic steel bridge at center in the image." }, { "from": "gpt", "value": "[(0.474, 0.562)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2424fb95bb17927c.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the blue cotton shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.200, 0.694)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95698d964e3a9da7.jpg", "conversations": [ { "from": "human", "value": "\nSelect a point on the dark gray suit at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.507, 0.589)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c99a4748fb50a3fd.jpg", "conversations": [ { "from": "human", "value": "\nCan you find the matte black camera at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.516, 0.588)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a3c62fc524fc2186.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.800, 0.542) and point (0.342, 0.580), which one is positioned behind?" }, { "from": "gpt", "value": "Positioned behind is point (0.800, 0.542)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8229d9fefac26dcc.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue water at center lie in front of metallic gray suspension bridge at center?" }, { "from": "gpt", "value": "Yes, blue water at center is in front of metallic gray suspension bridge at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/24beeb17aad92a8c.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the translucent plastic fish at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.317, 0.930)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/849dd6ec0d6d5275.jpg", "conversations": [ { "from": "human", "value": "\nHow far is point (0.117, 0.292) from the camera?" }, { "from": "gpt", "value": "A distance of 4.41 meters exists between point (0.117, 0.292) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e2bcb875419de4d5.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.254, 0.277) and point (0.158, 0.356), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.158, 0.356) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8ff2d0b7554363f3.jpg", "conversations": [ { "from": "human", "value": "\nBetween green grass at lower left and green leafy hedge at center, which one appears on the left side from the viewer's perspective?" }, { "from": "gpt", "value": "green leafy hedge at center is more to the left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d2cb36a36d823280.jpg", "conversations": [ { "from": "human", "value": "\nCould you measure the distance between transparent glass windshield at center and white plastic license plate at center?" }, { "from": "gpt", "value": "They are 23.63 inches apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c4e9a1311a28275.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the distance between red fabric vest at right and red glossy strawberries at lower right?" }, { "from": "gpt", "value": "A distance of 1.42 meters exists between red fabric vest at right and red glossy strawberries at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/26c18a8436a12acc.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, concrete at lower right or white glossy cruise ship at center?" }, { "from": "gpt", "value": "concrete at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/446e0179d7d1e595.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.151, 0.561) and point (0.971, 0.422), which one is positioned in front?" }, { "from": "gpt", "value": "Point (0.971, 0.422) is more forward." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/977ee1c236c29163.jpg", "conversations": [ { "from": "human", "value": "\nIs concrete at center to the right of matte red tail at upper center from the viewer's perspective?" }, { "from": "gpt", "value": "Indeed, concrete at center is positioned on the right side of matte red tail at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86cd54c248518669.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of green grass at lower center from brown gravel driveway at lower left?" }, { "from": "gpt", "value": "3.25 meters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bfdbbc6249a21320.jpg", "conversations": [ { "from": "human", "value": "\nDoes black matte t-shirt at center appear on the right side of white striped shirt at upper right?" }, { "from": "gpt", "value": "In fact, black matte t-shirt at center is to the left of white striped shirt at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c83e0680bcb8b6c7.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.615, 0.553) from camera?" }, { "from": "gpt", "value": "A distance of 174.07 meters exists between point (0.615, 0.553) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/405c18d4d796ab2a.jpg", "conversations": [ { "from": "human", "value": "\nCan you tell me the distance of metallic silver van at upper right from camera?" }, { "from": "gpt", "value": "A distance of 16.62 feet exists between metallic silver van at upper right and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea88f4a3db609eda.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in a conference room and need to reach a point marked at coordinates point (0.342, 0.691). If you are currently 1.51 meters away from this point, how far do you need to move to reach it?" }, { "from": "gpt", "value": "You need to move 1.51 meters to reach the point (0.342, 0.691) since you are currently 1.51 meters away from it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b07522ecbba679b1.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any gray water at center in the image." }, { "from": "gpt", "value": "[(0.211, 0.578)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7d7964668285080.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, brown wooden fence at center or shiny blue helmet at center, stands shorter?" }, { "from": "gpt", "value": "brown wooden fence at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4e93e5c966724c98.jpg", "conversations": [ { "from": "human", "value": "\nCan you give me an estimation of the distance between point (0.646, 0.623) and camera?" }, { "from": "gpt", "value": "Point (0.646, 0.623) is 6.74 feet away from camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c7b057649fc76f7.jpg", "conversations": [ { "from": "human", "value": "\nSelect a location on the peace sign tank top at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.115, 0.506)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7d13bbe1f57dcdf6.jpg", "conversations": [ { "from": "human", "value": "\nDoes clear glass pool at center appear under dark blue jeans at right?" }, { "from": "gpt", "value": "Yes, clear glass pool at center is below dark blue jeans at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4dac44ff4264da18.jpg", "conversations": [ { "from": "human", "value": "\nIs argyle-patterned shirt at center to the right of light brown fabric stroller at center from the viewer's perspective?" }, { "from": "gpt", "value": "Correct, you'll find argyle-patterned shirt at center to the right of light brown fabric stroller at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a1df28f7d7315b8b.jpg", "conversations": [ { "from": "human", "value": "\nHow close is matte jersey at center from matte red vest at center?" }, { "from": "gpt", "value": "matte jersey at center and matte red vest at center are 17.54 inches apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78a4848cd4b25a2f.jpg", "conversations": [ { "from": "human", "value": "\nYou are a student in the classroom and need to choose a monitor to work on. Which monitor, the matte black monitor at center or the black glossy monitor at center, would you choose if you want a larger screen?" }, { "from": "gpt", "value": "The black glossy monitor at center is larger than the matte black monitor at center, so you should choose the black glossy monitor at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/429e7400f835fd49.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from velvety blue pillow at upper left to camera." }, { "from": "gpt", "value": "velvety blue pillow at upper left and camera are 11.96 feet apart from each other." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/af7eb45034299d2b.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between green leafy hand at center and camera." }, { "from": "gpt", "value": "28.86 centimeters" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aca757abf57aecca.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.699, 0.828) or (0.661, 0.520)?" }, { "from": "gpt", "value": "Point (0.661, 0.520)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bbfbd42e38cd2984.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.508, 0.416) or point (0.428, 0.467)?" }, { "from": "gpt", "value": "Point (0.508, 0.416)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5ce7f30aa757acf0.jpg", "conversations": [ { "from": "human", "value": "\nYou are an observer looking at the photograph of the two windows. You notice the smooth black leather dress at center and the smooth skin hand at center. Which object is covering the other?" }, { "from": "gpt", "value": "The smooth black leather dress at center is positioned over the smooth skin hand at center, so the dress is covering the hand." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/31e0e8f0146f8dd7.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the interior space and want to exit through the doorway. Which direction should you walk to avoid the wooden sign at left?" }, { "from": "gpt", "value": "To exit through the doorway while avoiding the wooden sign at left, you should walk towards the right side of the interior space since the wooden sign at left is located on the left side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7106ebeb4f89b2bd.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of white cotton t-shirt at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.529, 0.595)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70da8bef6858209c.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the right, green mossy branch at center or green matte tree at center?" }, { "from": "gpt", "value": "From the viewer's perspective, green mossy branch at center appears more on the right side." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d348d673c24e877.jpg", "conversations": [ { "from": "human", "value": "\nBetween blonde hair at center and blonde silky hair at center, which one is positioned higher?" }, { "from": "gpt", "value": "blonde silky hair at center is higher up." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/670bd7824e7eea1a.jpg", "conversations": [ { "from": "human", "value": "\nChose the point of smooth concrete sidewalk at center. Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.745, 0.795)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc87ffd7cd8185bb.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of metallic blue seats at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.695, 0.830)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77af90ae4f253ca1.jpg", "conversations": [ { "from": "human", "value": "\nIn the scene under the corrugated metal roof, there are two shirts displayed at the center. The light blue shirt at center and the plaid fabric shirt at center. Which one is positioned to the right?" }, { "from": "gpt", "value": "The light blue shirt at center is positioned to the right of the plaid fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/66437361a63422f7.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.751, 0.200) or (0.035, 0.380)?" }, { "from": "gpt", "value": "The point (0.035, 0.380) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b2546fa59d00f71b.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of gray fabric camera at left? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.138, 0.681)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/358f229aa8895684.jpg", "conversations": [ { "from": "human", "value": "\nBetween yellow matte apple at center and green matte apple at center, which one is positioned higher?" }, { "from": "gpt", "value": "yellow matte apple at center is higher up." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/50a1b74d8868ba06.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.948, 0.578) and camera." }, { "from": "gpt", "value": "The distance of point (0.948, 0.578) from camera is 3.82 feet." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f84ec5b686a6f9a7.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.869, 0.323) and camera." }, { "from": "gpt", "value": "Point (0.869, 0.323) and camera are 224.07 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/67d60c192215fa7a.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in the public square and see the maroon hoodie at center and the transparent glass bubble at center. Which object is positioned to the right?" }, { "from": "gpt", "value": "The maroon hoodie at center is positioned to the right of the transparent glass bubble at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/241ad005c14bf9ae.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of white ceramic saucer at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.505, 0.952)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/09543f5eeeef243a.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black phone at center have a greater width compared to dark brown silky hair at center?" }, { "from": "gpt", "value": "Correct, the width of matte black phone at center exceeds that of dark brown silky hair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4cba14125b5aa242.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.323, 0.102) and point (0.133, 0.320), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.133, 0.320) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/179bc19f0aedad55.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.239, 0.692) or (0.503, 0.675)?" }, { "from": "gpt", "value": "Point (0.239, 0.692) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc1c53d67b39451a.jpg", "conversations": [ { "from": "human", "value": "\nPoint to any gray stone statue at center in the image." }, { "from": "gpt", "value": "[(0.621, 0.373)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a082aa16132f1e26.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the historic building and want to take a photo of the brown stone church at center without any obstructions. Are the frosted white branches at center blocking your view of the church?" }, { "from": "gpt", "value": "The frosted white branches at center are in front of the brown stone church at center, so they are blocking the view of the church. You would need to move the branches or find a different angle to capture an unobstructed photo of the church." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e9fb8b3f30cfd0fc.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the bronze statue at upper center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.354, 0.089)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4abf535ed622fd9.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.181, 0.245) come farther from viewer compared to point (0.842, 0.225)?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c022928318d2ac17.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.242, 0.956) come farther from viewer compared to point (0.165, 0.342)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/296a08524d35fe4a.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a dark gray hoodie at center. Pinpoint a point to the dark gray hoodie at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.757, 0.502)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/253524a2410ae18b.jpg", "conversations": [ { "from": "human", "value": "\nWhich is behind, point (0.023, 0.506) or point (0.888, 0.445)?" }, { "from": "gpt", "value": "Point (0.888, 0.445)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/64fabaca7808c251.jpg", "conversations": [ { "from": "human", "value": "\nBetween point (0.911, 0.703) and point (0.203, 0.391), which one is positioned behind?" }, { "from": "gpt", "value": "The point (0.911, 0.703) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9fc7d94af55ffa74.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.135, 0.495) farther from viewer compared to point (0.634, 0.884)?" }, { "from": "gpt", "value": "Yes, point (0.135, 0.495) is behind point (0.634, 0.884)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6153ed1e08d26c79.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of brown leather bag at lower right? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.920, 0.861)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8787ffb12c8ace1d.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.635, 0.812) come in front of point (0.514, 0.406)?" }, { "from": "gpt", "value": "Yes, point (0.635, 0.812) is in front of point (0.514, 0.406)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/15af8817bd778596.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray hoodie at center lie behind matte plastic toy sword at left?" }, { "from": "gpt", "value": "Yes, gray hoodie at center is further from the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d6037c7db4e2432.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.645, 0.423) or (0.613, 0.770)?" }, { "from": "gpt", "value": "Positioned in front is point (0.645, 0.423)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c7523053bd6c07a.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the event and need to capture a clear photo of the matte black blouse at center and the floral fabric kimono at center. Which one is closer to the camera?" }, { "from": "gpt", "value": "The matte black blouse at center is closer to the camera since the floral fabric kimono at center is behind it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0aa36ea4c2c16b9a.jpg", "conversations": [ { "from": "human", "value": "\nIs light blue wood door at center below white plastic street sign at center?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ef1add3026bb211.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black jacket at center is shorter than black fabric helmet at lower left?" }, { "from": "gpt", "value": "No, matte black jacket at center is not shorter than black fabric helmet at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef4cac4726094651.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at center smaller than wooden cabin at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ccfa5305c441a356.jpg", "conversations": [ { "from": "human", "value": "\nWho is more forward, (0.669, 0.981) or (0.198, 0.713)?" }, { "from": "gpt", "value": "Point (0.669, 0.981) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1fb3bd82786b6632.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the location of black matte shirt at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.358, 0.655)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0a677aaa3aed1bf.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between blue glossy kayak at center and camera." }, { "from": "gpt", "value": "blue glossy kayak at center and camera are 4.11 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b076242381370b5.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the point marked by coordinates point (0.551, 0.528) in the image. What object is directly in front of you?" }, { "from": "gpt", "value": "The point (0.551, 0.528) indicates the matte green military vehicle at center, so the object directly in front of you is the matte green military vehicle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6120a65084903ac2.jpg", "conversations": [ { "from": "human", "value": "\nIn the traditional setting, there are two red robes present. The red velvet robe at lower right and the red silk robe at center. Which one is taller?" }, { "from": "gpt", "value": "The red velvet robe at lower right is taller than the red silk robe at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e7cda01e869e153.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a yellow rubber snake at right. Pinpoint a point to the yellow rubber snake at right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.873, 0.572)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/218d5c705ff611f6.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to burgundy fabric umbrella at center? Please provide its 2D coordinates.Where can I find burgundy fabric umbrella at center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.750, 0.283)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85fb1c36adcb28c9.jpg", "conversations": [ { "from": "human", "value": "\nWho is more distant from viewer, (0.512, 0.942) or (0.470, 0.842)?" }, { "from": "gpt", "value": "The point (0.512, 0.942) is more distant." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34a454b9bd9e5a76.jpg", "conversations": [ { "from": "human", "value": "\nWho is shorter, brown dirt field at lower center or white metallic water tower at upper right?" }, { "from": "gpt", "value": "brown dirt field at lower center is shorter." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8dbf9399e1c82582.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between camouflage-patterned jacket at center and camera." }, { "from": "gpt", "value": "camouflage-patterned jacket at center and camera are 76.60 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ccf5aa7175aa7146.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the origin point in the image and want to reach the green leafy tree at center. Which direction should you move to get there?" }, { "from": "gpt", "value": "The green leafy tree at center is located at point 0.764 on the x and 0.492 on the y. Since you are at the origin, you should move towards the right and slightly upwards to reach it." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e54bf68845773bbe.jpg", "conversations": [ { "from": "human", "value": "\nWho is lower down, gray striped shirt at left or floral fabric baby at center?" }, { "from": "gpt", "value": "Positioned lower is gray striped shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb43c24ba7ea5107.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black couch at upper left below natural stone at lower right?" }, { "from": "gpt", "value": "No, matte black couch at upper left is not below natural stone at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd5362ee2940e9fb.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.269, 0.567) positioned before point (0.836, 0.814)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/703e92e011bab2e7.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the camera position looking at the market stall. There is a point marked at coordinates point (0.646, 0.433). How far is that point from you?" }, { "from": "gpt", "value": "The point (0.646, 0.433) is 2.00 meters away from the camera position." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a159410f0f8eb7ff.jpg", "conversations": [ { "from": "human", "value": "\nDescribe the object at (0.285, 0.339)." }, { "from": "gpt", "value": "matte black t-shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a8ac73697ff7056.jpg", "conversations": [ { "from": "human", "value": "\nTell me the distance between green leafy palm at center and camera." }, { "from": "gpt", "value": "green leafy palm at center and camera are 87.57 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/66ce9ea42c40b0d6.jpg", "conversations": [ { "from": "human", "value": "\nLocate floral cotton dress at center in the image." }, { "from": "gpt", "value": "[(0.438, 0.803)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/325a33705192b743.jpg", "conversations": [ { "from": "human", "value": "\nWhich is more to the left, metallic silver bulletin board at center or hardcover book at right?" }, { "from": "gpt", "value": "metallic silver bulletin board at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a7485b7a625bb57.jpg", "conversations": [ { "from": "human", "value": "\nWhere is teal frosting at upper right located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.853, 0.214)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f4e45ff8baedba7a.jpg", "conversations": [ { "from": "human", "value": "\nWhere is smooth bark tree at upper left located? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.121, 0.120)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bfec5f6020853cbd.jpg", "conversations": [ { "from": "human", "value": "\nCan you point to white fluffy cloud at upper center? Please provide its 2D coordinates.Where can I find white fluffy cloud at upper center? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.589, 0.195)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e32b445aa22722b2.jpg", "conversations": [ { "from": "human", "value": "\nHow far is point (0.172, 0.566) from the camera?" }, { "from": "gpt", "value": "They are 15.49 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb296acb46b991fc.jpg", "conversations": [ { "from": "human", "value": "\nBased on the scene, can you tell me what is located at the coordinates point (0.515, 0.205)?" }, { "from": "gpt", "value": "At point (0.515, 0.205) lies dark gray crowd at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de928291596fba6f.jpg", "conversations": [ { "from": "human", "value": "\nLocate a point on the stone archway at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.656, 0.536)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a610b1247c40f29e.jpg", "conversations": [ { "from": "human", "value": "\nDoes wet skin foot at center have a lesser height compared to glossy black toe at center?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/af9b7d221eb00118.jpg", "conversations": [ { "from": "human", "value": "\nGive me the distance from point (0.539, 0.831) to camera." }, { "from": "gpt", "value": "A distance of 41.17 meters exists between point (0.539, 0.831) and camera." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f0211e8d15fd6bbc.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing at the origin point of the coordinate system in the image. You need to move to the wooden ladder at left. What are the coordinates you should move to?" }, { "from": "gpt", "value": "The coordinates for the wooden ladder at left are at point (0.175, 0.605)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2aba36a24abe94c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if metallic gray escalator steps at center is positioned above matte orange wall at right?" }, { "from": "gpt", "value": "Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a81702d53b787ee3.jpg", "conversations": [ { "from": "human", "value": "\nIs white rocky mountain at upper center below orange matte dress at lower left?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ee7306bc75bf8d96.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of wire mesh fence at lower left less distant than that of rusty metal rail at lower center?" }, { "from": "gpt", "value": "No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/279d3764780ba6ca.jpg", "conversations": [ { "from": "human", "value": "\nWhich is in front, point (0.221, 0.653) or point (0.259, 0.695)?" }, { "from": "gpt", "value": "Point (0.221, 0.653) is in front." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/884fddbb30371c17.jpg", "conversations": [ { "from": "human", "value": "\nYou are standing in front of the solar panel at the outdoor event. You notice two points marked on the structure. The first point is at coordinates point (0.791, 0.505) and the second is at point (0.854, 0.578). From your viewpoint, which point is closer to you?" }, { "from": "gpt", "value": "Point (0.854, 0.578) is closer to you because the description states that point (0.791, 0.505) is behind point (0.854, 0.578)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c5e808ce4a623e76.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between point (0.629, 0.830) and camera." }, { "from": "gpt", "value": "They are 3.21 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/33a0eb270fd394b2.jpg", "conversations": [ { "from": "human", "value": "\nDoes american flag at center appear on the left side of patterned fabric headdress at center?" }, { "from": "gpt", "value": "In fact, american flag at center is to the right of patterned fabric headdress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/719f43e8a40b6982.jpg", "conversations": [ { "from": "human", "value": "\nYou are a city planner analyzing the urban layout. Given the brown glassy building at upper center and the brown glass building at center, which one has a greater width according to the aerial view?" }, { "from": "gpt", "value": "The brown glassy building at upper center has a greater width than the brown glass building at center as stated in the description." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7ade9e9e1bc5292.jpg", "conversations": [ { "from": "human", "value": "\nGive me the position of maroon fabric shirt at lower right. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.772, 0.478)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/38e6457822ad8824.jpg", "conversations": [ { "from": "human", "value": "\nHow far apart are white matte sweatshirt at center and yellow paper at upper center?" }, { "from": "gpt", "value": "They are 95.47 centimeters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9bfa540ac8f2c2e.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth bark tree at center bigger than gold metallic bicycle at lower left?" }, { "from": "gpt", "value": "Correct, smooth bark tree at center is larger in size than gold metallic bicycle at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b47e0b8580b5c3f4.jpg", "conversations": [ { "from": "human", "value": "\nYou are an artist trying to paint the sunset scene. You want to ensure the silhouette tree at upper center and the silhouette leafy tree at left are proportionally accurate. Which tree should you paint taller?" }, { "from": "gpt", "value": "The silhouette tree at upper center should be painted taller because it has a greater height compared to the silhouette leafy tree at left according to the description." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dce41ec69653d623.jpg", "conversations": [ { "from": "human", "value": "\nWhat is the 2D location of white shirt at right? Please provide its 2D coordinates." }, { "from": "gpt", "value": "[(0.787, 0.578)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1e4a279bfc32412.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue water at center have a smaller size compared to blue glossy pool at lower left?" }, { "from": "gpt", "value": "No, blue water at center is not smaller than blue glossy pool at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03437236d40b59ac.jpg", "conversations": [ { "from": "human", "value": "\nDoes white fabric at upper left appear on the right side of smooth beige hand at center?" }, { "from": "gpt", "value": "In fact, white fabric at upper left is to the left of smooth beige hand at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7cd9d72449ccf626.jpg", "conversations": [ { "from": "human", "value": "\nLocate all white glossy sedan at center in the image." }, { "from": "gpt", "value": "[(0.667, 0.934)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/388694245f9f0506.jpg", "conversations": [ { "from": "human", "value": "\nWhich is above, black polished gondola at left or matte black hair at center?" }, { "from": "gpt", "value": "matte black hair at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4b39d4352de90376.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these two, green needle-like at left or yellow matte flower at center, stands shorter?" }, { "from": "gpt", "value": "Standing shorter between the two is yellow matte flower at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7fc96040fc24c97d.jpg", "conversations": [ { "from": "human", "value": "\nHow far away is point (0.684, 0.734) from camera?" }, { "from": "gpt", "value": "4.86 feet" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a125b3ed4e7a1a9e.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a pink leather top at center. Pinpoint a point to the pink leather top at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.726, 0.853)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba447ff8df033c04.jpg", "conversations": [ { "from": "human", "value": "\nMeasure the distance between metallic silver stroller at center-right and camera." }, { "from": "gpt", "value": "metallic silver stroller at center-right and camera are 61.63 meters apart." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c030f98050de5319.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.278, 0.755) behind point (0.540, 0.509)?" }, { "from": "gpt", "value": "That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0f8ef1d0c5bca01.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.693, 0.778) come farther from viewer compared to point (0.710, 0.616)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7240791951796160.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if light blue denim shirt at center is positioned to the right of dark blue shirt at center?" }, { "from": "gpt", "value": "Incorrect, light blue denim shirt at center is not on the right side of dark blue shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ec9f28246aa2534.jpg", "conversations": [ { "from": "human", "value": "\nIs neutral fabric couch at center to the right of dark wood stairs at lower right from the viewer's perspective?" }, { "from": "gpt", "value": "Incorrect, neutral fabric couch at center is not on the right side of dark wood stairs at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aa3c107667441fa5.jpg", "conversations": [ { "from": "human", "value": "\nBetween velvet floral top at center and white satin jumpsuit at center, which one has more height?" }, { "from": "gpt", "value": "white satin jumpsuit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49f0cdc3b0c372b1.jpg", "conversations": [ { "from": "human", "value": "\nYou are a photographer at the themed area. You need to capture a photo of the two children interacting with Alice. The polka dot skirt at left and the black dotted fabric dress at left are both in the frame. Which child is positioned more to the left side of the photo?" }, { "from": "gpt", "value": "The polka dot skirt at left is positioned to the left of the black dotted fabric dress at left, so the child wearing the polka dot skirt at left is more to the left side of the photo." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7623f228c443cd61.jpg", "conversations": [ { "from": "human", "value": "\nIn the image, there is a matte orange robe at center. Pinpoint a point to the matte orange robe at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be rounded to three decimal places, indicating the absolute pixel location of the point in the image." }, { "from": "gpt", "value": "[(0.378, 0.775)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d247a656a65c99b.jpg", "conversations": [ { "from": "human", "value": "\nIs brushed metal fire truck at left thinner than metallic rectangular at upper center?" }, { "from": "gpt", "value": "In fact, brushed metal fire truck at left might be wider than metallic rectangular at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e01795ff61f3ca9.jpg", "conversations": [ { "from": "human", "value": "\nLocate the rocky stone waterfall at center in the image." }, { "from": "gpt", "value": "[(0.547, 0.819)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7330b4f126192a81.jpg", "conversations": [ { "from": "human", "value": "\nDoes white plastic keyboard at center have a lesser height compared to white plastic mouse at lower right?" }, { "from": "gpt", "value": "In fact, white plastic keyboard at center may be taller than white plastic mouse at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5c72e4e5c5d2095.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue denim jeans at center is positioned below matte black podium at center?" }, { "from": "gpt", "value": "No, blue denim jeans at center is not below matte black podium at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba65eeb1f0520a20.jpg", "conversations": [ { "from": "human", "value": "\nChoose the point of olive green shirt at center. Your answer should be formatted as a tuple, i.e. [(x, y)], where the tuple contains the x and y coordinates of a point satisfying the conditions above. The coordinates should be between 0 and 1, indicating the normalized pixel location of the point." }, { "from": "gpt", "value": "[(0.337, 0.525)]" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fa9dc0c7aad1ba27.jpg", "conversations": [ { "from": "human", "value": "\nWhat can be observed at (0.059, 0.572)?" }, { "from": "gpt", "value": "metallic silver fire truck at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a1c0e481d690e6d.jpg", "conversations": [ { "from": "human", "value": "\nBetween beige textured shell at center and brown textured shell at upper center, which one is positioned lower?" }, { "from": "gpt", "value": "beige textured shell at center is below." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/284077e70d5b2510.jpg", "conversations": [ { "from": "human", "value": "\nIs point (0.400, 0.405) closer to viewer compared to point (0.489, 0.517)?" }, { "from": "gpt", "value": "No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c51f1f947d37fdf6.jpg", "conversations": [ { "from": "human", "value": "\nDoes point (0.524, 0.934) come in front of point (0.416, 0.508)?" }, { "from": "gpt", "value": "Yes, it is in front of point (0.416, 0.508)." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/559a72911dd0d69b.jpg", "conversations": [ { "from": "human", "value": "\nDoes green matte bone at lower left have a smaller size compared to matte gray nose at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, green matte bone at lower left is not smaller than matte gray nose at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8e38e3f2914a384.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny metallic car at lower center closer to the viewer compared to metallic silver car at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/30e9db5daf0816a1.jpg", "conversations": [ { "from": "human", "value": "\nIs matte brown ribbed shirt at center thinner than sparkly silver buckle at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea51ea07ed56c54b.jpg", "conversations": [ { "from": "human", "value": "\nIs black plastic mixing console at center wider than black matte dress at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, black plastic mixing console at center's width does not surpass black matte dress at left's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/445f7937ce2fe6be.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the white matte plate at center? Choose among these: (A) matte white shirt at center (B) tan wool blazer at center (C) matte black dress at center (D) matte black suit at upper left" }, { "from": "gpt", "value": "(B) tan wool blazer at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0cc312837c177797.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if purple matte wine glass at upper right is bigger than clear glass wine at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7dc0fb01dfe94f6.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) smooth bark tree at center (B) rough stone hut at center (C) wooden door at center" }, { "from": "gpt", "value": "(A) smooth bark tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4ee42329c5bcec90.jpg", "conversations": [ { "from": "human", "value": "\nIs light blue fabric umpire at center below blue textured uniform at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, light blue fabric umpire at center is not below blue textured uniform at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e83aad9311196aa.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.707, 0.922) (B) (0.966, 0.914)" }, { "from": "gpt", "value": "(B) (0.966, 0.914)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1f50c667e73055b.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) green matte table at center (B) silver metallic computer at center" }, { "from": "gpt", "value": "(A) green matte table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f284f484ce74cdc1.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) rusty metal rail at lower right (B) green leafy weed at lower right" }, { "from": "gpt", "value": "(A) rusty metal rail at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/872b0a056b0a6863.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray suit at center is positioned below dark brown hair at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dde05be212050157.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the black matte teapot at center from the following options: (A) white matte rice at lower center (B) green grassy hay at center (C) wooden table at center (D) white woven cloth at center?" }, { "from": "gpt", "value": "(C) wooden table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/461321906204b076.jpg", "conversations": [ { "from": "human", "value": "\nIs green matte forest at center below green matte tree at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, green matte forest at center is above green matte tree at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6414b08ba95a8b76.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.815, 0.706) (B) (0.722, 0.580) (C) (0.918, 0.802)" }, { "from": "gpt", "value": "(B) (0.722, 0.580)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/478357dcc4f16919.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.469, 0.109) (B) (0.979, 0.223)" }, { "from": "gpt", "value": "(B) (0.979, 0.223)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/63a7e8784bf56ad8.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden mirror at center closer to the viewer compared to zebra-patterned fabric stool at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/262ba0e0179fc037.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the beach sand at center from the following options: (A) matte pink dress at center (B) striped cotton dress at center (C) white cotton shirt at center (D) red satin dress at center?" }, { "from": "gpt", "value": "(B) striped cotton dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a3b35b20b713ebc.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown cotton shirt at center appear under dark brown fabric headscarf at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, brown cotton shirt at center is not positioned below dark brown fabric headscarf at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/74524448a9a4e328.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the black fabric shirt at upper left? Choose among these: (A) pink fur at center (B) black matte nose at center" }, { "from": "gpt", "value": "(B) black matte nose at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e2aa9ffd059dc14b.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of smooth bark tree trunk at center in relation to green matte parrot at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/59587dc9ba2740ed.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) metallic silver helmet at upper right (B) black matte motorcycle at center (C) white matte shirt at center (D) matte black helmet at center" }, { "from": "gpt", "value": "(A) metallic silver helmet at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0647dbdc13dab68.jpg", "conversations": [ { "from": "human", "value": "\nIs maroon fabric baseball cap at right thinner than shiny metallic eagle at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, maroon fabric baseball cap at right might be wider than shiny metallic eagle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed1d9f65b4bbb201.jpg", "conversations": [ { "from": "human", "value": "\nIs blue uniform at center positioned before blue hard hat at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/30c0fae7d5462f1f.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if polished chrome pendant light at upper right is positioned below metallic glass pendant light at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, polished chrome pendant light at upper right is not positioned below metallic glass pendant light at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de73973263d3de63.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is gray textured dome at center located relative to green leafy tree at lower left? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70c6835ed8c3bfc4.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) rusty wood tree trunk at upper left (B) gray weathered wood at left" }, { "from": "gpt", "value": "(B) gray weathered wood at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4052e9e2ef988bd.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) green grassy field at lower center (B) black wires at upper center (C) dark green mountain at center" }, { "from": "gpt", "value": "(C) dark green mountain at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bfacf18a5ed6cdf5.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark brown shorts at center come in front of light brown fabric headscarf at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3cc7ebed09664667.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of orange reflective vest at left in reference to white paper at lower right? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0464a1dafaa33d6d.jpg", "conversations": [ { "from": "human", "value": "\nIs blue cardboard box at center positioned at the back of silver metallic hand at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, blue cardboard box at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e90bc634117e17e7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white fluffy cat at center is thinner than white fluffy cat at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, white fluffy cat at center might be wider than white fluffy cat at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d4c6c8f69447073b.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.681, 0.495) (B) (0.019, 0.073)" }, { "from": "gpt", "value": "(B) (0.019, 0.073)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/654e7239aa609162.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) light blue shirt at center (B) light brown hair at lower right (C) white paper sign at center" }, { "from": "gpt", "value": "(A) light blue shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a1459cdefba1e51a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) silver metallic stroller at center (B) black leather handbag at right" }, { "from": "gpt", "value": "(A) silver metallic stroller at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/027f4744cb95cb85.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.033, 0.770) (B) (0.273, 0.420) (C) (0.401, 0.658)" }, { "from": "gpt", "value": "(A) (0.033, 0.770)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1985078252f39b11.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.448, 0.978) (B) (0.523, 0.103)" }, { "from": "gpt", "value": "(A) (0.448, 0.978)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ce7970658d31204.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.634, 0.567) (B) (0.657, 0.973)" }, { "from": "gpt", "value": "(B) (0.657, 0.973)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/31a125ce6b4b64cf.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) shiny blue football player at center (B) white jersey at center" }, { "from": "gpt", "value": "(A) shiny blue football player at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/63c5f5424570e71c.jpg", "conversations": [ { "from": "human", "value": "\nIs denim jacket at center behind matte black jacket at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/98e0f9cefc6d6629.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.292, 0.731) (B) (0.495, 0.461)" }, { "from": "gpt", "value": "(A) (0.292, 0.731)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7fb62e02ae76513.jpg", "conversations": [ { "from": "human", "value": "\nDoes pinkish salmon at grill front have a greater width compared to golden brown salmon at grill front? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/adb18167f02a8823.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) white cotton shirt at right (B) striped shirt at center" }, { "from": "gpt", "value": "(B) striped shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/74f7d07bd4d57585.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) smooth glass tower at upper center (B) brown stone tower at upper left" }, { "from": "gpt", "value": "(A) smooth glass tower at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5696a594d90f231e.jpg", "conversations": [ { "from": "human", "value": "\nIs translucent plastic cup at center further to camera compared to white dotted shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, translucent plastic cup at center is in front of white dotted shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01e3800aff37062d.jpg", "conversations": [ { "from": "human", "value": "\nIs black knitted sweater at upper right bigger than blue t-shirt at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, black knitted sweater at upper right is not larger than blue t-shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dbe3f2a7d495e38e.jpg", "conversations": [ { "from": "human", "value": "\nDoes green matte ice cream cone at upper center appear over pink matte hand at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1816e6cd9d2fda31.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of green leafy tree at upper center in relation to green leafy water at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9f43d2f137ee28a.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.311, 0.394) (B) (0.884, 0.386)" }, { "from": "gpt", "value": "(A) (0.311, 0.394)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c57571e48c14e418.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if yellow matte bicycle at center is wider than white glossy bicycle at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/000559da530cd6eb.jpg", "conversations": [ { "from": "human", "value": "\nIs checkered fabric shirt at center above light blue denim jeans at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, checkered fabric shirt at center is positioned over light blue denim jeans at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/182c066f68c4292e.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown sandy dirt field at center have a larger size compared to white corrugated metal hut at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, brown sandy dirt field at center is larger in size than white corrugated metal hut at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c3dd38eee82e25ba.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) white glossy boat at center (B) green leafy tree at left" }, { "from": "gpt", "value": "(A) white glossy boat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c27ed8a3386a7d07.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) white plastic toilet bowl at center (B) white glossy sink at center (C) matte white faucet at upper center (D) pink knitted tablecloth at lower left, is positioned closest to the satin silver faucet at center?" }, { "from": "gpt", "value": "(C) matte white faucet at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a7d2dd95cc0a720.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte red jacket at center have a larger size compared to black matte bicycle helmet at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b8a7711f72a708eb.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) silver metallic camcorder at upper right (B) white fabric shirt at upper left" }, { "from": "gpt", "value": "(B) white fabric shirt at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4e1dced2d50c1fc9.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) shiny red car at center (B) hawaiian shirt at center (C) blue cotton t-shirt at center (D) yellow metallic car at center" }, { "from": "gpt", "value": "(A) shiny red car at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/51e63bbf350634e0.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of brown stone fountain at center and green leafy tree at right in the image provided, where is brown stone fountain at center located with respect to green leafy tree at right? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a45a32504594a360.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green grass at lower center is thinner than matte brown couple at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, green grass at lower center's width is not less than matte brown couple at lower right's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df1520149234ed9a.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.137, 0.536) (B) (0.268, 0.430) (C) (0.841, 0.384) (D) (0.199, 0.431)" }, { "from": "gpt", "value": "(A) (0.137, 0.536)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf95f19038d05bf8.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) green leafy palm tree at left (B) green leafy palm tree at upper center (C) green leafy coconut tree at center" }, { "from": "gpt", "value": "(B) green leafy palm tree at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c0a18e608644655d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte blue cushion at center is positioned to the right of wooden table at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, matte blue cushion at center is not on the right side of wooden table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d86241e088aa239.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) blue polished wood pirate ship at center (B) clear water at lower center" }, { "from": "gpt", "value": "(B) clear water at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1206b6110bbdc750.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the green striped tie at center among (A) red fabric coat at left (B) tan textured suit at center (C) black suit at center (D) blue striped tie at center?" }, { "from": "gpt", "value": "(A) red fabric coat at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/032c232cf04076c8.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of rough concrete block at center more distant than that of black glossy magpie at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a8564090e028f04.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.087, 0.431) (B) (0.813, 0.438)" }, { "from": "gpt", "value": "(A) (0.087, 0.431)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ed569da96012376.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) dark green textured tree at left (B) snowy mountain at center (C) brown dry grass at center" }, { "from": "gpt", "value": "(B) snowy mountain at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/32269ae705f9405c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if teal fabric clothing at center is smaller than metallic pole at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, teal fabric clothing at center is smaller than metallic pole at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ac9c86ebb492dbce.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the green leafy trees at center among (A) green leafy trees at right (B) brown muddy water at center?" }, { "from": "gpt", "value": "(B) brown muddy water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b1bc5d9f25c117c.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of white cotton socks at left and purple cotton dress at center in the image provided, where is white cotton socks at left located with respect to purple cotton dress at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0c385fbc31b29114.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) brown wooden rail at left (B) green mossy bark tree at left" }, { "from": "gpt", "value": "(B) green mossy bark tree at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6111ebe505f6a3fa.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy island at center bigger than white sailboat at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, green leafy island at center is bigger than white sailboat at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ad3bfd3646af418a.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte gray jacket at left have a greater width compared to matte black goggles at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, matte gray jacket at left has a greater width compared to matte black goggles at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/904a2e3168382375.jpg", "conversations": [ { "from": "human", "value": "\nDoes khaki shorts at center lie behind matte black tank top at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/959536aee8c19d2c.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the brown dirt path at center among (A) green mossy hillside at left (B) brown bark tree at upper left?" }, { "from": "gpt", "value": "(B) brown bark tree at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0796db7ddc0dcb4b.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) beige fabric trench coat at center (B) leather textured briefcase at center (C) silver metallic train at center" }, { "from": "gpt", "value": "(B) leather textured briefcase at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a515833411f05267.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is muddy green t-shirt at center located relative to matte gray t-shirt at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/203aec3694386c5d.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth concrete pavement at center closer to the viewer compared to light beige coat at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, smooth concrete pavement at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a99baf42b518d59e.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of dark blue water at center and metallic silver mast at right in the image provided, where is dark blue water at center located with respect to metallic silver mast at right? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d00e574d7449ab42.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.698, 0.720) (B) (0.789, 0.180)" }, { "from": "gpt", "value": "(B) (0.789, 0.180)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/871f49d122fdf7e5.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of matte yellow school bus at center more distant than that of yellow matte license plate at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eac21fcbdef955f5.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.482, 0.500) (B) (0.192, 0.739)" }, { "from": "gpt", "value": "(B) (0.192, 0.739)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd05b2424e662c31.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the dark brown hair at center? Choose among these: (A) blue fabric shirt at lower left (B) matte gray seat at lower left" }, { "from": "gpt", "value": "(B) matte gray seat at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08467b3385cafd26.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) green scaly lizard at center (B) green scaly tail at center" }, { "from": "gpt", "value": "(A) green scaly lizard at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78eb5879d5e1299d.jpg", "conversations": [ { "from": "human", "value": "\nDoes striped shirt at lower left appear under white shirt at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, striped shirt at lower left is above white shirt at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7415eb078dbb5b3b.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte t-shirt at center bigger than dark brown leather jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4109e6dd0d0c1902.jpg", "conversations": [ { "from": "human", "value": "\nIs white polka dot fabric umbrella at center wider than red fabric stool at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, white polka dot fabric umbrella at center is wider than red fabric stool at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85d2228d227239df.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.281, 0.389) (B) (0.435, 0.994)" }, { "from": "gpt", "value": "(A) (0.281, 0.389)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d388034f8cd5ce24.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the yellow fabric blanket at center? Choose from: (A) dark blue leather shoe at lower center (B) matte black shorts at center" }, { "from": "gpt", "value": "(B) matte black shorts at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8d5d412cd0f9212.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if light brown skin at center is positioned to the left of brown furry foot at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, light brown skin at center is to the right of brown furry foot at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/30c681411416c580.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) matte pink shirt at center (B) blue reflective sunglasses at center (C) pink fabric shirt at center (D) brown cardboard sign at upper center" }, { "from": "gpt", "value": "(C) pink fabric shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e87b3dc35faff09.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) dark wool coat at left (B) white plastic license plate at center" }, { "from": "gpt", "value": "(B) white plastic license plate at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2635f9ae04cd90b2.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.148, 0.708) (B) (0.258, 0.936)" }, { "from": "gpt", "value": "(A) (0.148, 0.708)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d5ba9e0f9e0fa440.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy trees at right below white glossy boat at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, green leafy trees at right is above white glossy boat at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b973371fdb23646d.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the green matte jacket at center from the following options: (A) blue denim jeans at left (B) green fabric shirt at lower right?" }, { "from": "gpt", "value": "(B) green fabric shirt at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5fcb70216be6a080.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) green textured cypress tree at center (B) blue translucent water at center (C) rough textured rock at lower right" }, { "from": "gpt", "value": "(C) rough textured rock at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c36fee44d0007bd.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) dark gray hoodie at left (B) metallic chain-link fence at center-left" }, { "from": "gpt", "value": "(A) dark gray hoodie at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3ffdcb46cd68626a.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) brown wooden gazebo at upper right (B) green leafy tree at upper center" }, { "from": "gpt", "value": "(B) green leafy tree at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49e6d51155587f3f.jpg", "conversations": [ { "from": "human", "value": "\nDoes white knitted sweater at center appear on the right side of white cloth at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, white knitted sweater at center is positioned on the right side of white cloth at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/962ca50b060cba9d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green grass at center is positioned to the right of white matte van at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, green grass at center is not to the right of white matte van at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60f72be49c3ae85c.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.089, 0.953) (B) (0.394, 0.758) (C) (0.620, 0.534)" }, { "from": "gpt", "value": "(A) (0.089, 0.953)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/55153531acdfc66d.jpg", "conversations": [ { "from": "human", "value": "\nDoes green glass door at center appear under matte purple signboard at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, green glass door at center is positioned under matte purple signboard at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e0aab1e41f5599b.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the white soft pillow at center? Select from: (A) fluffy white pillow at center (B) patterned fabric couch at center" }, { "from": "gpt", "value": "(A) fluffy white pillow at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fcedc4bcd9d0c333.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if red uniform at center is positioned to the right of black reflective uniform at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, red uniform at center is not to the right of black reflective uniform at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c9eab29bb78e09f0.jpg", "conversations": [ { "from": "human", "value": "\nDoes white feather boa at left come in front of blonde feather boa at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b955fff68d022a1.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.724, 0.922) (B) (0.912, 0.622)" }, { "from": "gpt", "value": "(A) (0.724, 0.922)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d3c5b9d4555e533.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.321, 0.608) (B) (0.514, 0.658) (C) (0.617, 0.467)" }, { "from": "gpt", "value": "(A) (0.321, 0.608)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d6c46125e285ecb.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue water at center is positioned below dark gray metallic boat at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/53f50bea771570ea.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) gold metallic sculpture at center (B) green leafy tree at center (C) matte white sculpture at upper center" }, { "from": "gpt", "value": "(A) gold metallic sculpture at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f6d575ae687fdc9.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) olive-green fabric jacket at center-right (B) metallic traffic light at upper center (C) dark blue leather jacket at center (D) leather jacket at center, is positioned closest to the smooth concrete sidewalk at center?" }, { "from": "gpt", "value": "(D) leather jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a510c42d0be57f8.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte van at left have a lesser width compared to soft blue fabric at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1561ca2711be8010.jpg", "conversations": [ { "from": "human", "value": "\nIs blue satin regalia at center bigger than brown leather vest at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, blue satin regalia at center is not larger than brown leather vest at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c3e4e1124ae3908e.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black signboard at center to the left of black paper at lower right from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, matte black signboard at center is positioned on the left side of black paper at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cafac16259b33884.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black backpack at left positioned before orange fabric shirt at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0522fce6788f273e.jpg", "conversations": [ { "from": "human", "value": "\nDoes cardboard bear at upper center have a lesser width compared to black matte car at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, cardboard bear at upper center might be wider than black matte car at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/952e7b4c05aff6a5.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the dirt field at lower center? Select from: (A) brown cotton shirt at lower left (B) brown fabric pants at lower center (C) light blue shirt at center" }, { "from": "gpt", "value": "(C) light blue shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d81fbc4b66c0fc1.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is camouflage fabric uniform at center located relative to brown wooden table at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b44dda616f1fa89a.jpg", "conversations": [ { "from": "human", "value": "\nDoes green grassy pasture at center have a larger size compared to brown glossy horse at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green grassy pasture at center has a larger size compared to brown glossy horse at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7aa0798e04b265e8.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) white glass door at center (B) brown wood tree at upper center" }, { "from": "gpt", "value": "(B) brown wood tree at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/11d68f6ede4d79ca.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at left to the right of wooden cabin at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, green leafy tree at left is not to the right of wooden cabin at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c22308a6ea931d09.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the black hair at lower center among (A) dark hair at center (B) smooth glossy red pole at left?" }, { "from": "gpt", "value": "(B) smooth glossy red pole at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c345b2e88d1b2ebe.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black jacket at center have a lesser width compared to leather jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, matte black jacket at center has a lesser width compared to leather jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ace2e9ed593aec77.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.295, 0.578) (B) (0.006, 0.244)" }, { "from": "gpt", "value": "(B) (0.006, 0.244)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49f015b5a48f07ae.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.474, 0.908) (B) (0.259, 0.367) (C) (0.679, 0.787) (D) (0.075, 0.588)" }, { "from": "gpt", "value": "(C) (0.679, 0.787)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/137c5b196e035d81.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte golf cart at center lie behind matte blue shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c45728072111097.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if camouflage fabric uniform at center is wider than matte black rifle at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, camouflage fabric uniform at center is not wider than matte black rifle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5eeec5919733245.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue denim shirt at left have a larger size compared to dark green uniform at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5fc3607a3e78c796.jpg", "conversations": [ { "from": "human", "value": "\nIs matte red shirt at center positioned in front of dark blue jeans at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/94a9252108da41a9.jpg", "conversations": [ { "from": "human", "value": "\nWhere is white satin shirt at center located in relation to matte red jacket at center in the image? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef5972fad4674ea9.jpg", "conversations": [ { "from": "human", "value": "\nWhere is blue cotton shirt at center located in relation to light beige fabric newborn at center in the image? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/63aafcb90335e91c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.154, 0.886) (B) (0.123, 0.900)" }, { "from": "gpt", "value": "(B) (0.123, 0.900)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1ac12fd88952c2f.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) dark green leafy tree at lower center (B) green leafy tree at left (C) transparent glass building at right (D) transparent glass tower at center" }, { "from": "gpt", "value": "(B) green leafy tree at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/57dcb3d4f2e7b1f7.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the nail polish at center? Select from: (A) smooth silver coin at center (B) silver polished coin at center" }, { "from": "gpt", "value": "(B) silver polished coin at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d270da259ecc2b1d.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the black ribbed water tower at center among (A) black ribbed water tank at center (B) dull brown dirt at center (C) gray concrete hut at left?" }, { "from": "gpt", "value": "(C) gray concrete hut at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c6abb7382999ab7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray cotton hoodie at center is smaller than yellow matte apple at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, gray cotton hoodie at center is not smaller than yellow matte apple at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b8b74ee7be08087e.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) golden brown crusty pizza at center (B) matte red robe at upper left (C) black matte shirt at center (D) matte red robe at lower right" }, { "from": "gpt", "value": "(A) golden brown crusty pizza at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77d2f6773bcd826d.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the green matte tree at center? (A) gray gravel train track at center (B) green leafy tree at upper left (C) white matte train at center" }, { "from": "gpt", "value": "(A) gray gravel train track at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e3bbc1757e3f3646.jpg", "conversations": [ { "from": "human", "value": "\nDoes red fabric umbrella at upper left appear on the left side of metallic folding chair at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, red fabric umbrella at upper left is to the left of metallic folding chair at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ff23fb66adab33c.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass at lower left bigger than green plastic brush at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/112732a06311de59.jpg", "conversations": [ { "from": "human", "value": "\nDoes black suit at center appear on the right side of dark gray suit at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, black suit at center is positioned on the right side of dark gray suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23d81dbfe84c9d99.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the denim jacket at lower right among (A) matte brown leather jacket at center (B) black matte uniform at center?" }, { "from": "gpt", "value": "(A) matte brown leather jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/89e81223b531f9e7.jpg", "conversations": [ { "from": "human", "value": "\nIs gray fabric shirt at center thinner than white matte pants at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, gray fabric shirt at center has a lesser width compared to white matte pants at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/adef8a6a831cea33.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny multicolored parrot at center below green glossy parrot at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de357bfd7d3a621e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) green textured pine tree at left (B) green leafy tree at upper center (C) green textured pine tree at center (D) green grassy at center" }, { "from": "gpt", "value": "(A) green textured pine tree at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ee48ce8130303736.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.099, 0.314) (B) (0.538, 0.734)" }, { "from": "gpt", "value": "(A) (0.099, 0.314)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/960895739fac1761.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of blue fabric playpen at center less distant than that of blue mesh playpen at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, blue fabric playpen at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a951da539092f095.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny red car at lower center to the left of matte white clock at upper center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, shiny red car at lower center is not to the left of matte white clock at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6467f323f47d9ae4.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the light gray fabric shirt at lower right among (A) plaid fabric skateboarder at right (B) smooth concrete alley at center?" }, { "from": "gpt", "value": "(A) plaid fabric skateboarder at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/10982ab6e08fb723.jpg", "conversations": [ { "from": "human", "value": "\nDoes stone tower at center appear under matte green t-shirt at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, stone tower at center is positioned under matte green t-shirt at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d65b54624f76c250.jpg", "conversations": [ { "from": "human", "value": "\nDoes black matte jacket at center have a smaller size compared to plaid shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, black matte jacket at center occupies less space than plaid shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef64fd3d2ae1a0c1.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.113, 0.767) (B) (0.770, 0.427)" }, { "from": "gpt", "value": "(A) (0.113, 0.767)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05a645fddf7578ef.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) black glossy limousine at center (B) matte black suit at center (C) dark blue suit at center" }, { "from": "gpt", "value": "(B) matte black suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/98dcbdf2bbf9cab7.jpg", "conversations": [ { "from": "human", "value": "\nDoes yellow matte doll at center appear on the right side of glossy plastic table at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, yellow matte doll at center is positioned on the right side of glossy plastic table at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b580be34ae81da78.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) light wood acoustic guitar at upper center (B) tabby fur cat at upper right (C) red textured pillow at upper right" }, { "from": "gpt", "value": "(A) light wood acoustic guitar at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/230546dbb834996c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.452, 0.445) (B) (0.219, 0.425)" }, { "from": "gpt", "value": "(B) (0.219, 0.425)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff5999e96f692bf7.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.466, 0.448) (B) (0.034, 0.909)" }, { "from": "gpt", "value": "(B) (0.034, 0.909)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f3b532a36186fae7.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) metallic silver bicycle at center (B) shiny silver bicycle at center" }, { "from": "gpt", "value": "(B) shiny silver bicycle at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/613af67ac00a0956.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.107, 0.636) (B) (0.169, 0.400)" }, { "from": "gpt", "value": "(B) (0.169, 0.400)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0855b3672c4e6cc4.jpg", "conversations": [ { "from": "human", "value": "\nIs brown glossy holstein-friesian at center to the right of brown glossy jersey cow at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, brown glossy holstein-friesian at center is positioned on the right side of brown glossy jersey cow at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8f1532e284041b75.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of light blue lace shorts at center in relation to green fabric shirt at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0a5f8f701ec9a83.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of orange fabric jacket at center in reference to matte black jacket at center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36737631f11e5ea4.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the black fabric jacket at center from the following options: (A) black matte suit at lower left (B) matte black suit at center?" }, { "from": "gpt", "value": "(A) black matte suit at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f3d300df18e0de67.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark wood armchair at center is positioned to the right of brown leather armchair at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, dark wood armchair at center is to the left of brown leather armchair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/63a48e7065d09126.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) smooth gray stones at left (B) gray smooth rock at lower right" }, { "from": "gpt", "value": "(B) gray smooth rock at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/767df651822374e9.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) matte brown magazine at lower right (B) matte cardboard magazine at lower left (C) matte paper magazine at center" }, { "from": "gpt", "value": "(B) matte cardboard magazine at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d2c046a42e63753.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.807, 0.637) (B) (0.446, 0.623)" }, { "from": "gpt", "value": "(B) (0.446, 0.623)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b180b5ce354df4b.jpg", "conversations": [ { "from": "human", "value": "\nDoes white fluffy dog at center have a greater width compared to green leafy plant at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white fluffy dog at center's width does not surpass green leafy plant at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4c666f53fde9de7.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black megaphone at center have a larger size compared to multicolored feathered hat at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, matte black megaphone at center is bigger than multicolored feathered hat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bffa675222f9edc6.jpg", "conversations": [ { "from": "human", "value": "\nIs striped shirt at center wider than translucent plastic cup at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, striped shirt at center is wider than translucent plastic cup at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c8bd9d5ab0380394.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.735, 0.867) (B) (0.286, 0.567) (C) (0.260, 0.334) (D) (0.018, 0.495)" }, { "from": "gpt", "value": "(A) (0.735, 0.867)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/768da1e7dfd85e0f.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the white paper poster at upper right? Select from: (A) black plastic swivel chair at lower center (B) blue fabric swivel chair at lower right (C) orange paper poster at upper center" }, { "from": "gpt", "value": "(A) black plastic swivel chair at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/13ffa6ffcaac2c1d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.775, 0.450) (B) (0.820, 0.167)" }, { "from": "gpt", "value": "(A) (0.775, 0.450)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3466644e75dc0329.jpg", "conversations": [ { "from": "human", "value": "\nDoes black velvet dress at center have a greater width compared to pink satin dress at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, black velvet dress at center might be narrower than pink satin dress at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7f004526787aa4c.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the metallic yellow crane arm at center from the following options: (A) white metallic truck at lower right (B) white metallic crane at center (C) yellow metallic crane at center (D) matte black truck at lower left?" }, { "from": "gpt", "value": "(D) matte black truck at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e3beba5e216da65.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) camouflage uniform at center (B) black matte t-shirt at left" }, { "from": "gpt", "value": "(A) camouflage uniform at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0a3ee463f035b94.jpg", "conversations": [ { "from": "human", "value": "\nWhere is black matte t-shirt at left located in relation to blue satin tank top at upper right in the image? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/71ff6502d142d1b8.jpg", "conversations": [ { "from": "human", "value": "\nIs white glossy bikini at center to the right of white matte bikini at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, white glossy bikini at center is to the left of white matte bikini at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/961808ce2fed3e28.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) silver metallic van at center (B) white matte car at center" }, { "from": "gpt", "value": "(A) silver metallic van at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dde2bc4837cad8f6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green plastic ball at upper left is thinner than white matte snowman at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, green plastic ball at upper left might be wider than white matte snowman at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed7012e06416b40f.jpg", "conversations": [ { "from": "human", "value": "\nIs matte red sweater at center thinner than brown paper bag at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte red sweater at center is thinner than brown paper bag at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/48139b284a0a0e7e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black plastic ruler at bottom is positioned to the left of gold/yellow metal ring at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, black plastic ruler at bottom is not to the left of gold/yellow metal ring at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b1591f18ff1f889.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte white lamp at upper center have a greater width compared to matte black coffee table at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aa640bee8088ed56.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.626, 0.545) (B) (0.727, 0.341) (C) (0.540, 0.200) (D) (0.434, 0.339)" }, { "from": "gpt", "value": "(B) (0.727, 0.341)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5da095b5771c630d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dull brown mud at center is positioned below yellow metallic excavator at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6322f986ecffe262.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.031, 0.512) (B) (0.742, 0.425)" }, { "from": "gpt", "value": "(A) (0.031, 0.512)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a5e88f3c32f21bb.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) green algae at lower center (B) green leafy trees at center" }, { "from": "gpt", "value": "(A) green algae at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe4934bb3e2f0b8f.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue matte tank top at center appear over matte blue tank top at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03b10634112b75d5.jpg", "conversations": [ { "from": "human", "value": "\nDoes pink checkered shirt at left appear on the left side of brushed metal bag at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, pink checkered shirt at left is to the left of brushed metal bag at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/22401f49491af7f4.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) matte yellow building at center (B) yellow matte building at left" }, { "from": "gpt", "value": "(B) yellow matte building at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/26b4ea56567ff12b.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) black floral top at right (B) green fabric jacket at center (C) matte black suit at center" }, { "from": "gpt", "value": "(C) matte black suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1af83b0c650ab297.jpg", "conversations": [ { "from": "human", "value": "\nDoes light green t-shirt at center have a smaller size compared to smooth white paper at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, light green t-shirt at center is not smaller than smooth white paper at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/136ff41bb1699ad2.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) white printed t-shirt at center (B) green matte shorts at lower left" }, { "from": "gpt", "value": "(B) green matte shorts at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/57d64c3f28f81e8e.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the dark blue jeans at center? (A) dark gray wool coat at center (B) patterned fabric coat at center (C) beige fabric coat at center" }, { "from": "gpt", "value": "(A) dark gray wool coat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1842181103c96755.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the tan canvas backpack at center? (A) brown canvas backpack at center (B) brown leather hat at upper center (C) green canvas tent at left" }, { "from": "gpt", "value": "(A) brown canvas backpack at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f4b41c2c8620bb3.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is brown matte bison at center located relative to light brown matte yak at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a63084403edc62af.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) brown stone hillside at lower right (B) brown stone village at center" }, { "from": "gpt", "value": "(B) brown stone village at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f1537b33b68c2b3.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of rugged stone cliff at center and blue/yellow fabric life vest at center in the image provided, where is rugged stone cliff at center located with respect to blue/yellow fabric life vest at center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c42d9b675943654c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) white glossy oven at center (B) polished stainless steel kettle at right (C) black plastic coffee maker at right (D) brown granite countertop at lower right" }, { "from": "gpt", "value": "(B) polished stainless steel kettle at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8ddb9177cceb7640.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of silver metallic handgun at center right and polished metal handgun at center in the image provided, where is silver metallic handgun at center right located with respect to polished metal handgun at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2de57fba73399737.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) matte blue jacket at center (B) green fabric jacket at center (C) wooden bridge at center" }, { "from": "gpt", "value": "(C) wooden bridge at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ac3daafc3cf7127a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.578, 0.438) (B) (0.858, 0.452) (C) (0.821, 0.398) (D) (0.644, 0.402)" }, { "from": "gpt", "value": "(D) (0.644, 0.402)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44a3e95ad66bea65.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) yellow fabric backpack at left (B) rough stone mountain at center (C) purple matte backpack at center" }, { "from": "gpt", "value": "(B) rough stone mountain at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/178526c49dc76015.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the green fleece hat at center? (A) gray cotton shirt at center (B) pearl necklace at upper center" }, { "from": "gpt", "value": "(A) gray cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b1589d5dd81ec78.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the matte white paper bag at center? (A) translucent plastic candy at center (B) black shirt at left (C) pink fabric dress at lower left (D) gray cotton shirt at center" }, { "from": "gpt", "value": "(D) gray cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6919fab40a344c22.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) patterned fabric arm at center (B) white matte camera at upper center (C) patterned fabric shirt at center (D) matte black flashlight at upper center" }, { "from": "gpt", "value": "(B) white matte camera at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c322d7a6934777e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if silver metallic sedan at right is smaller than white matte car at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, silver metallic sedan at right is not smaller than white matte car at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e8885f16befb451.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if transparent water at center is positioned below black matte container ship at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, transparent water at center is located below black matte container ship at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/440a95e0d149e696.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the gray fleece jacket at center? (A) black zip-up sweater at center (B) black smooth arm at center (C) white fuzzy beard at center" }, { "from": "gpt", "value": "(A) black zip-up sweater at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc73d8b8558e53f9.jpg", "conversations": [ { "from": "human", "value": "\nDoes white satin dress at center have a greater width compared to white smooth shirt at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, white satin dress at center might be narrower than white smooth shirt at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ceff7e2e7b06d91.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) red velvet dress at center (B) fuzzy brown monkey at center" }, { "from": "gpt", "value": "(B) fuzzy brown monkey at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d36e34560ba508b.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of green grass at lower right in relation to gray matte bird at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8f270a82cfb9cdbe.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown cobblestone pavement at center appear on the left side of white paper poster at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, brown cobblestone pavement at center is not to the left of white paper poster at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/19bb0460396580cb.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if pink frosted cake at center is thinner than smooth plastic toy soldier at right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, pink frosted cake at center might be wider than smooth plastic toy soldier at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c0325237275cd33.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of green matte shirt at center and blue jeans at center in the image provided, where is green matte shirt at center located with respect to blue jeans at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04bbe9d35c50ab91.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.710, 0.620) (B) (0.328, 0.339) (C) (0.951, 0.430) (D) (0.423, 0.877)" }, { "from": "gpt", "value": "(D) (0.423, 0.877)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e293dc0effb2615.jpg", "conversations": [ { "from": "human", "value": "\nIs dark brown leather jacket at lower right smaller than green matte shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/39217563fb00c495.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of green leafy tree at upper center and green leafy tree at upper left in the image provided, where is green leafy tree at upper center located with respect to green leafy tree at upper left? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0042699f729f9c08.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green glossy parrot at left located in relation to shiny orange parrot at center in the image? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a572fdc479b41de7.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the green copper spire at upper center among (A) green copper roof at center (B) cobblestone alley at center (C) metallic gold clock at center (D) green copper tower at center?" }, { "from": "gpt", "value": "(D) green copper tower at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d4a4a6be159304c3.jpg", "conversations": [ { "from": "human", "value": "\nWhere is matte black t-shirt at center located in relation to black plastic sunglasses at center in the image? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f3be6e01bda9980.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) green leafy trees at center (B) black volcanic rocks at lower left (C) green leafy palm tree at upper left (D) dark blue water at lower right" }, { "from": "gpt", "value": "(B) black volcanic rocks at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/948d8991c4f66ecb.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.930, 0.927) (B) (0.903, 0.417)" }, { "from": "gpt", "value": "(A) (0.930, 0.927)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3990a4b81c7aac34.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if satin silver minivan at lower left is positioned to the right of metallic silver car at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, satin silver minivan at lower left is not on the right side of metallic silver car at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36efec3badc3ad7e.jpg", "conversations": [ { "from": "human", "value": "\nDoes wooden podium at center appear on the right side of purple satin vest at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, wooden podium at center is positioned on the right side of purple satin vest at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a9a4175f843d957c.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of matte black leather jacket at left in relation to glossy leather boot at lower left? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c0bf28245a64c95.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.143, 0.870) (B) (0.235, 0.614)" }, { "from": "gpt", "value": "(B) (0.235, 0.614)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5117b754613a09a9.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.555, 0.659) (B) (0.703, 0.250) (C) (0.470, 0.416) (D) (0.008, 0.452)" }, { "from": "gpt", "value": "(D) (0.008, 0.452)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8f599263a2f8081b.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the golden crunchy nuts at table right among (A) dark gray shirt at upper center (B) white plastic table at lower right?" }, { "from": "gpt", "value": "(A) dark gray shirt at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0300a2a9534d460f.jpg", "conversations": [ { "from": "human", "value": "\nDoes green rough bark tree at center have a greater width compared to brown sandy dirt track at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, green rough bark tree at center is wider than brown sandy dirt track at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/43327fd6201b9403.jpg", "conversations": [ { "from": "human", "value": "\nIs oil painting at right in front of polished dark wood bench at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, oil painting at right is in front of polished dark wood bench at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/931d598f3322f560.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) matte black shirt at left (B) smooth gray shirt at lower right" }, { "from": "gpt", "value": "(B) smooth gray shirt at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/99389d5625e1d6e3.jpg", "conversations": [ { "from": "human", "value": "\nDoes brick pavement at center have a lesser width compared to green glossy leafy plant at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/47265166aa6b8d45.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black paper at center is wider than translucent glass beer at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, black paper at center has a greater width compared to translucent glass beer at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/baa2bab61a31f7b0.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.435, 0.528) (B) (0.673, 0.470) (C) (0.069, 0.823)" }, { "from": "gpt", "value": "(B) (0.673, 0.470)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/924774f5cf958b18.jpg", "conversations": [ { "from": "human", "value": "\nIs black glossy cruise ship at center below skinny man at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d8731823ee578090.jpg", "conversations": [ { "from": "human", "value": "\nIs gray stone pavement at center wider than black cardboard sign at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, gray stone pavement at center is wider than black cardboard sign at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78a07eec9ebedc24.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) brown woolen sheep at center (B) brown woolen sweater at left" }, { "from": "gpt", "value": "(A) brown woolen sheep at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c421d89b7d39c201.jpg", "conversations": [ { "from": "human", "value": "\nIs black smooth hole at upper right smaller than smooth bark tree at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, black smooth hole at upper right is smaller than smooth bark tree at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b4e2098a2fcdb45.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) yellow leafy tree at center (B) brown liquid water at lower center" }, { "from": "gpt", "value": "(B) brown liquid water at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d075e269641e7e0c.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green grass at lower right located in relation to smooth concrete flood at left in the image? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7cdf57a0cf0be276.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) matte blue shirt at center (B) brown leather table at center (C) matte red sweater at center" }, { "from": "gpt", "value": "(C) matte red sweater at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8ba39f2ec6da7854.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the blue fabric shirt at right among (A) matte black jacket at upper left (B) white glossy table at center (C) black matte jacket at upper left?" }, { "from": "gpt", "value": "(B) white glossy table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/59e0eb0a46657314.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of green matte tree at center and snowy pine tree at center in the image provided, where is green matte tree at center located with respect to snowy pine tree at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f73946494af579f6.jpg", "conversations": [ { "from": "human", "value": "\nDoes white marble sculpture at center have a smaller size compared to white marble nude at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, white marble sculpture at center might be larger than white marble nude at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/865dfd126c05492b.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) pink cotton polo shirt at center (B) black metal fence at center" }, { "from": "gpt", "value": "(A) pink cotton polo shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dffcd6f4c8782710.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the matte red blazer at upper center? Choose among these: (A) red matte shirt at upper center (B) fluffy white plush at lower left" }, { "from": "gpt", "value": "(A) red matte shirt at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6785adfeada450ad.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the shiny red soccer player at center? (A) blue jersey at lower left (B) blue matte jersey at upper center (C) shiny red jersey at center" }, { "from": "gpt", "value": "(B) blue matte jersey at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/61c0832e49ec81ae.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the dark gray jacket at lower left? Choose among these: (A) dark gray jacket at center (B) black matte jacket at center" }, { "from": "gpt", "value": "(B) black matte jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fd22341ce4fd6821.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) green mossy stump at center (B) green leafy fern at center" }, { "from": "gpt", "value": "(B) green leafy fern at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a00871769d71889f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.747, 0.759) (B) (0.410, 0.622) (C) (0.994, 0.714)" }, { "from": "gpt", "value": "(B) (0.410, 0.622)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/206a07264968ddd7.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) black matte camera at upper right (B) black plastic lens at upper right" }, { "from": "gpt", "value": "(A) black matte camera at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f4f1c07ab959db3.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.538, 0.341) (B) (0.178, 0.741) (C) (0.680, 0.933) (D) (0.713, 0.637)" }, { "from": "gpt", "value": "(A) (0.538, 0.341)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/80d1af061a4ade59.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) white matte shirt at center (B) silky white curtain at left (C) light blue shirt at center" }, { "from": "gpt", "value": "(B) silky white curtain at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e9789c964a3e7368.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of matte gray tie at center in reference to plaid fabric tie at left? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0022aa7327636c98.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) white fabric thermometer at center (B) yellow fabric toy at center" }, { "from": "gpt", "value": "(B) yellow fabric toy at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e1fb3f3e5fc16a0c.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) brown leather jacket at left (B) black plastic camera at center (C) gray fleece jacket at center (D) matte gray puffer jacket at center" }, { "from": "gpt", "value": "(A) brown leather jacket at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b0464af6b1ffe71.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.704, 0.805) (B) (0.899, 0.619) (C) (0.751, 0.630)" }, { "from": "gpt", "value": "(C) (0.751, 0.630)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ceaf125ec7eb5021.jpg", "conversations": [ { "from": "human", "value": "\nDoes snow-covered branches at center have a smaller size compared to snow-covered tree at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, snow-covered branches at center might be larger than snow-covered tree at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/63a459623fbaf000.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.642, 0.491) (B) (0.732, 0.083) (C) (0.068, 0.597) (D) (0.650, 0.759)" }, { "from": "gpt", "value": "(D) (0.650, 0.759)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60b62c9c52165cc4.jpg", "conversations": [ { "from": "human", "value": "\nWhere is shiny pink robe at center located in relation to matte black hand at upper left in the image? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff144e913e1dc3a1.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of light blue cotton polo shirt at center and floral fabric dress at center in the image provided, where is light blue cotton polo shirt at center located with respect to floral fabric dress at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/52d5f9057ab635dd.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if satin white dress at center is positioned below black lace dress at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, satin white dress at center is located below black lace dress at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d98887816617c33.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the green matte bus at center? (A) matte blue backpack at center (B) denim jacket at center (C) blue plastic sign at upper center (D) white cotton hat at center" }, { "from": "gpt", "value": "(D) white cotton hat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/64decc282b1f63de.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black banner at upper center to the right of dark blue fabric at lower left from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte black banner at upper center is to the right of dark blue fabric at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8ed71a4cce7122eb.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the concrete bridge at center? (A) green leafy tree at upper center (B) green leafy tree at upper left (C) green leafy tree at lower left (D) green leafy tree at upper right" }, { "from": "gpt", "value": "(A) green leafy tree at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95f4e6c337f5d308.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of blue nylon jacket at center less distant than that of blue fabric hand at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/057e6b2bcbda556f.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the rusty metal train car at left? Choose from: (A) rusty metal pole at right (B) brown wooden pole at center-right (C) smooth metallic pole at center (D) orange matte train at center" }, { "from": "gpt", "value": "(D) orange matte train at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a9e8cdcf6ccd62d1.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.691, 0.839) (B) (0.708, 0.608) (C) (0.722, 0.681)" }, { "from": "gpt", "value": "(A) (0.691, 0.839)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/35d1e9c52d7b6bd4.jpg", "conversations": [ { "from": "human", "value": "\nIs brown textured tree at left positioned in front of shiny metallic tower at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is in front of shiny metallic tower at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58740c1c83f806d4.jpg", "conversations": [ { "from": "human", "value": "\nIs translucent misty water at center smaller than smooth brown tree at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, translucent misty water at center might be larger than smooth brown tree at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d1c87e9bf62b74e.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte purple skirt at left appear over blue textured fabric dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, matte purple skirt at left is not above blue textured fabric dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0770b151595ea095.jpg", "conversations": [ { "from": "human", "value": "\nDoes stone inscription at center appear over green leafy palm tree at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, stone inscription at center is not above green leafy palm tree at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c664a773903798c1.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the black striped shirt at center? Choose from: (A) maroon jersey at center (B) black rubber hockey stick at center" }, { "from": "gpt", "value": "(A) maroon jersey at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/22c0164cdf04ca45.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the camouflage uniform at center? (A) camouflage pants at center (B) camouflage boots at lower left" }, { "from": "gpt", "value": "(A) camouflage pants at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/049a096238c284df.jpg", "conversations": [ { "from": "human", "value": "\nDoes white metal stool at center appear over pink fabric doll at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white metal stool at center is not positioned above pink fabric doll at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/22f08299aa80aced.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown dirt at lower center have a larger size compared to brown dry stalks at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/034ab3b0eac3fc4a.jpg", "conversations": [ { "from": "human", "value": "\nIs rocky cliff at center to the right of green leafy tree at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, rocky cliff at center is not to the right of green leafy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b89c46fa9cc395d9.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the yellow fabric shirt at left? Choose from: (A) white fleece hoodie at center (B) orange cotton shirt at center" }, { "from": "gpt", "value": "(B) orange cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/438e8824eaf9a3fd.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) khaki fabric coat at left (B) tan leather coat at left" }, { "from": "gpt", "value": "(B) tan leather coat at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9dc41b88b877c7f7.jpg", "conversations": [ { "from": "human", "value": "\nIs floral-patterned fabric skirt at lower right below shiny red fabric dress at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, floral-patterned fabric skirt at lower right is not positioned below shiny red fabric dress at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fabf4ce8aaf9c798.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte shirt at center to the left of dark brown leather jacket at lower left from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white matte shirt at center is not to the left of dark brown leather jacket at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d575b1e19ccef88f.jpg", "conversations": [ { "from": "human", "value": "\nDoes wooden signboard at upper right appear on the left side of green plaid kilt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, wooden signboard at upper right is not on the left side of green plaid kilt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4cd62bb662d8631d.jpg", "conversations": [ { "from": "human", "value": "\nWhere is silver metallic laptop at center located in relation to green matte shirt at center in the image? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5ff6ece4a6819c93.jpg", "conversations": [ { "from": "human", "value": "\nDoes speckled orange and white fish at center come behind shiny orange fish at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, speckled orange and white fish at center is in front of shiny orange fish at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b8f4e6cc047d714.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.548, 0.300) (B) (0.761, 0.795) (C) (0.312, 0.286) (D) (0.161, 0.775)" }, { "from": "gpt", "value": "(A) (0.548, 0.300)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be7bff132bed7568.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.677, 0.517) (B) (0.582, 0.503) (C) (0.839, 0.708)" }, { "from": "gpt", "value": "(B) (0.582, 0.503)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7be1c40bf720e151.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte microphone at right smaller than black matte microphone at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, black matte microphone at right is smaller than black matte microphone at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a33bb4f887735893.jpg", "conversations": [ { "from": "human", "value": "\nDoes green matte jacket at center come behind white plastic ski at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is in front of white plastic ski at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/679e585ecf8c4398.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) gray rock formation at center (B) american flag at upper right" }, { "from": "gpt", "value": "(A) gray rock formation at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/42b5e7cf70aac832.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) polka dot fabric bag at center (B) cable-knit sweater at center" }, { "from": "gpt", "value": "(B) cable-knit sweater at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9d75c7d8d1cb62a.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black cabinet at center wider than black matte speaker at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte black cabinet at center is wider than black matte speaker at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85b7bb8d5483b4c8.jpg", "conversations": [ { "from": "human", "value": "\nDoes black leather suit at right appear over matte black scarf at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36287d5d3684aecc.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) dark gray sweater at center (B) black asphalt train track at left (C) dark gray fabric crowd at center (D) dark brown leather jacket at center" }, { "from": "gpt", "value": "(D) dark brown leather jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/963e983a34f38a25.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) light blue fabric swimsuit at lower right (B) light blue denim shorts at lower right" }, { "from": "gpt", "value": "(A) light blue fabric swimsuit at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2875a61953b9b6ab.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.397, 0.863) (B) (0.695, 0.489)" }, { "from": "gpt", "value": "(A) (0.397, 0.863)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c1677877476b65a0.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if leather jacket at center is positioned to the right of black plastic camera at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, leather jacket at center is to the left of black plastic camera at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b67026224604570.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) green leafy tree at upper center (B) black and white striped zebra at center (C) green grassy at center" }, { "from": "gpt", "value": "(A) green leafy tree at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0196fffa6795687e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.423, 0.981) (B) (0.071, 0.044) (C) (0.173, 0.453) (D) (0.825, 0.917)" }, { "from": "gpt", "value": "(C) (0.173, 0.453)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e2a8cb0a25622a65.jpg", "conversations": [ { "from": "human", "value": "\nDoes greenish water at lower left have a larger size compared to white cotton person at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, greenish water at lower left has a larger size compared to white cotton person at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f4df25c70b96c007.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte sailboat at center have a greater width compared to white glass space needle at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, white matte sailboat at center has a greater width compared to white glass space needle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5bab5df80d62095b.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of white matte t-shirt at center in relation to matte black t-shirt at upper right? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b3ef03bd20a9a574.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the orange life vest at center from the following options: (A) green water at center (B) yellow textured life vest at center (C) green wood canoe at lower center (D) yellow fuzzy vest at left?" }, { "from": "gpt", "value": "(C) green wood canoe at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/35aa6bf2ef686373.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) jeans at right (B) spotted fur harness at center (C) smooth rock at lower left" }, { "from": "gpt", "value": "(A) jeans at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3125bbb39d28f788.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny black dog at center above shiny brown dog at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, shiny black dog at center is not positioned above shiny brown dog at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6879fcd231743c5f.jpg", "conversations": [ { "from": "human", "value": "\nIs blue water at center positioned in front of smooth skin head at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, blue water at center is further to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec2812936d95a67b.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) white matte building at center (B) smooth concrete pier at lower right (C) blue glassy water at center" }, { "from": "gpt", "value": "(C) blue glassy water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/855e60b1bb89aa51.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.540, 0.541) (B) (0.521, 0.564)" }, { "from": "gpt", "value": "(B) (0.521, 0.564)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b023784dc9601f36.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.673, 0.864) (B) (0.202, 0.611)" }, { "from": "gpt", "value": "(A) (0.673, 0.864)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e861cf4c35b8bb96.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the green soft grass at lower right from the following options: (A) green grass at lower left (B) brown leather boot at center (C) striped sweater at center (D) green grass at lower center?" }, { "from": "gpt", "value": "(D) green grass at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a3847a4c4df8456e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) golden liquid at lower left (B) light brown wood table at left (C) white crumpled paper at lower right (D) white paper at center" }, { "from": "gpt", "value": "(D) white paper at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea07d732af49034b.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of green grass at center more distant than that of black cotton t-shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, green grass at center is in front of black cotton t-shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f8163a5f0a132590.jpg", "conversations": [ { "from": "human", "value": "\nIs metallic gold bikini at lower left to the left of white fabric umbrella at lower center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, metallic gold bikini at lower left is positioned on the left side of white fabric umbrella at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1aa6f3ddc863f5b8.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.665, 0.342) (B) (0.343, 0.720) (C) (0.545, 0.875)" }, { "from": "gpt", "value": "(A) (0.665, 0.342)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/462eb022b1aad6d9.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.342, 0.884) (B) (0.344, 0.189) (C) (0.765, 0.113)" }, { "from": "gpt", "value": "(A) (0.342, 0.884)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/84ead0cad81c728e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the dark brown leather jacket at center? Select from: (A) camouflage fabric drum at center (B) blue water at lower center (C) matte black jacket at left (D) smooth wooden drum at lower center" }, { "from": "gpt", "value": "(D) smooth wooden drum at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37864b7dcb28fdcf.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) dark brown wooden stairs at upper right (B) clear acrylic display case at center" }, { "from": "gpt", "value": "(B) clear acrylic display case at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7f67cc78f5984d62.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if light blue denim jacket at center is positioned above smooth brown potato at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a561b1f573eab4c9.jpg", "conversations": [ { "from": "human", "value": "\nIs transparent ice sculpture at center smaller than clear ice dragon at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, transparent ice sculpture at center might be larger than clear ice dragon at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ecda08cd53e0d674.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte suit at left smaller than white striped shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, black matte suit at left is not smaller in size than white striped shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70cbbeeac68dc4f3.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the black fabric shirt at center? Choose from: (A) yellow cardboard sign at center (B) white t-shirt at center (C) brown sweater at left (D) beige straw hat at upper right" }, { "from": "gpt", "value": "(B) white t-shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0331401e003c0c72.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of blue plastic slide at upper center and black glossy dog at upper right in the image provided, where is blue plastic slide at upper center located with respect to black glossy dog at upper right? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ac34fe01288bd2e4.jpg", "conversations": [ { "from": "human", "value": "\nWhere is matte gray cap at upper right located in relation to black fabric lanyard at right in the image? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b6550cd9655cf0e.jpg", "conversations": [ { "from": "human", "value": "\nIs matte brown leather jacket at center bigger than blue denim jeans at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, matte brown leather jacket at center is larger in size than blue denim jeans at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd8064f1b6c55353.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) green leafy tree at center (B) green matte tree at center (C) green grassy river at lower center (D) green matte evergreen tree at center-right" }, { "from": "gpt", "value": "(A) green leafy tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/633b467523d48c00.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at center have a smaller size compared to metallic gray boat at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, green leafy tree at center might be larger than metallic gray boat at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4ae63f44082e7b16.jpg", "conversations": [ { "from": "human", "value": "\nIs pink fabric skateboarder at center closer to camera compared to matte pink shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, pink fabric skateboarder at center is in front of matte pink shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d8cdb80cdfb9cfb.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black matte suit at center is positioned to the right of black silk tie at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find black matte suit at center to the right of black silk tie at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea98c02df23d0f9e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue jersey at center is wider than printed cotton t-shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, blue jersey at center has a greater width compared to printed cotton t-shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5cb8150cdd4a7094.jpg", "conversations": [ { "from": "human", "value": "\nDoes olive corduroy jacket at center have a lesser width compared to green knit beanie at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aecb402d493c6b46.jpg", "conversations": [ { "from": "human", "value": "\nDoes green grass at center have a smaller size compared to pink blossoms at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, green grass at center is smaller than pink blossoms at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/188b5379f5af2b40.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) white cotton shirt at center (B) pink fabric at lower center (C) black fabric shirt at center (D) matte red shirt at center" }, { "from": "gpt", "value": "(C) black fabric shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3642f041dc0d3907.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the white glossy motorcycle at center? (A) white fabric flag at center (B) multicolored fabric at center" }, { "from": "gpt", "value": "(B) multicolored fabric at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e04205d9bb944434.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.267, 0.328) (B) (0.717, 0.536)" }, { "from": "gpt", "value": "(B) (0.717, 0.536)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/627e7d908bd81b77.jpg", "conversations": [ { "from": "human", "value": "\nDoes green fabric backpack at center appear under textured blue baseball cap at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, green fabric backpack at center is located below textured blue baseball cap at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/468f578869db9a1d.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) tabby fur cat at center (B) green glossy eye at center (C) white plastic keyboard at upper center" }, { "from": "gpt", "value": "(C) white plastic keyboard at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4fadad8a36aaf853.jpg", "conversations": [ { "from": "human", "value": "\nIs fuzzy brown dog at left smaller than fuzzy fur paw at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, fuzzy brown dog at left is not smaller than fuzzy fur paw at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5f96ffdc75cf2d0f.jpg", "conversations": [ { "from": "human", "value": "\nIs gray stone base at lower center smaller than white stone soldier at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, gray stone base at lower center might be larger than white stone soldier at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8726f0c4d60dd76.jpg", "conversations": [ { "from": "human", "value": "\nIs brown brick pavement at lower left positioned at the back of green leafy hedge at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a95828ca6fa62b64.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the blue polished wood boat at upper right? Choose among these: (A) blue wooden boat at left (B) rusty rock at center" }, { "from": "gpt", "value": "(B) rusty rock at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4da948c7460521f7.jpg", "conversations": [ { "from": "human", "value": "\nDoes brick tower at right come in front of smooth stone tower at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b85b4990333fc11.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) yellow metal barrier at center (B) green fleece jacket at center" }, { "from": "gpt", "value": "(A) yellow metal barrier at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/988d16c62b79b32e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.950, 0.650) (B) (0.545, 0.364)" }, { "from": "gpt", "value": "(A) (0.950, 0.650)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b818be4e8cff8fb4.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the porcelain doll at center? Select from: (A) shiny gold doll at center (B) white porcelain doll at center" }, { "from": "gpt", "value": "(A) shiny gold doll at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b396f52b0050b900.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the matte black shirt at center? Choose among these: (A) white glossy table at center (B) black fabric shirt at left (C) matte blue shirt at center" }, { "from": "gpt", "value": "(B) black fabric shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9448fa96eda42ac4.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte screen at center is positioned above smooth skin face at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, matte screen at center is located above smooth skin face at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb61fadc5426ec35.jpg", "conversations": [ { "from": "human", "value": "\nDoes wooden sailboat at center appear over white wooden sailboat at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bb58ec31382a0419.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the green leafy tree at center from the following options: (A) matte black cap at center (B) wooden bench at center?" }, { "from": "gpt", "value": "(A) matte black cap at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7364bd1202c6bce8.jpg", "conversations": [ { "from": "human", "value": "\nDoes black wood cabinet at upper center lie behind black wood bookcase at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/596b43b1eae2813e.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of white cotton shirt at upper center in reference to floral-patterned tablecloth at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/750e879fc07a3094.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) matte black jacket at left (B) matte brown sweater at center, is positioned farthest from the knitted sweater at center?" }, { "from": "gpt", "value": "(A) matte black jacket at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5dc53b41a965d75d.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) blue glass traffic light at upper left (B) maroon/yellow locomotive at center, is positioned farthest from the brown gravel train track at left?" }, { "from": "gpt", "value": "(A) blue glass traffic light at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/786da314c596bec7.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.600, 0.564) (B) (0.056, 0.714)" }, { "from": "gpt", "value": "(A) (0.600, 0.564)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c8358f620cd2f6e6.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.500, 0.833) (B) (0.562, 0.222)" }, { "from": "gpt", "value": "(B) (0.562, 0.222)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4b502e85e9bc419.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte gray suit at center appear on the right side of light gray checkered suit at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, matte gray suit at center is to the right of light gray checkered suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d4cd310eaadc6aab.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) transparent glass fountain at center (B) transparent glass sphere at center" }, { "from": "gpt", "value": "(A) transparent glass fountain at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c02735ed80d2ccd5.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is white glossy horse at upper left located relative to black glossy cape at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5193642917b0fc40.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.396, 0.844) (B) (0.179, 0.725) (C) (0.087, 0.972)" }, { "from": "gpt", "value": "(B) (0.179, 0.725)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d2809e48dc52c9ed.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if striped woolen shawl at upper right is thinner than matte black face at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, striped woolen shawl at upper right is not thinner than matte black face at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc9c7ccb974a92b6.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark gray fur at center appear under fuzzy white fur at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, dark gray fur at center is not below fuzzy white fur at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8cf769a1c0365388.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the matte red cowboy hat at upper center? (A) blue tulle ballet skirt at lower center (B) matte plastic toy gun at center" }, { "from": "gpt", "value": "(B) matte plastic toy gun at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c470155d1b76902.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) black fabric jacket at center (B) matte black backpack at left" }, { "from": "gpt", "value": "(B) matte black backpack at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eee59d89f34a460a.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of dark gray cloud at upper center in relation to brown wooden bench at lower center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/15f5a4e802a2cdc7.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of metallic blue car at lower left in reference to metallic silver car at center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb0926bbba9072c1.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if knitted gray sweater at left is smaller than white striped sweater at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, knitted gray sweater at left occupies less space than white striped sweater at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fa55f075f5767ba1.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) purple matte shirt at left (B) white glossy table at lower right" }, { "from": "gpt", "value": "(A) purple matte shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fee85e9ecf0b4418.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) dotted fabric bag at center (B) white cotton shirt at center" }, { "from": "gpt", "value": "(B) white cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/10abe91264ea430c.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.760, 0.069) (B) (0.154, 0.956)" }, { "from": "gpt", "value": "(A) (0.760, 0.069)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/265964eb7a057984.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte red dress at center appear over matte black hoodie at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5959677e032e5ee.jpg", "conversations": [ { "from": "human", "value": "\nIs dark gray water at center to the right of green fabric dog at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find dark gray water at center to the right of green fabric dog at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29f02ff9a3982fb4.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the metallic red car at left? Choose among these: (A) gray concrete curb at lower right (B) metallic blue sedan at right (C) shiny silver sedan at left (D) matte silver car at center-left" }, { "from": "gpt", "value": "(C) shiny silver sedan at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4bb0ebd0fd0a4a42.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.589, 0.080) (B) (0.119, 0.741)" }, { "from": "gpt", "value": "(B) (0.119, 0.741)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1130491dca8a04a9.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue soft baby at center appear over black satin tie at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, blue soft baby at center is located above black satin tie at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f817ba3ab6df53df.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of black smooth suit at center less distant than that of patterned fabric bed at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, black smooth suit at center is behind patterned fabric bed at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88d7c3fc982f5cd3.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of white matte shirt at lower right and silhouette fabric at center in the image provided, where is white matte shirt at lower right located with respect to silhouette fabric at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6194b8aee7ac978c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown fuzzy coat at center is positioned to the left of wooden handrail at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, brown fuzzy coat at center is not on the left side of wooden handrail at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/97e99b823367b9ae.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the matte red armchair at center? (A) black metal side table at right (B) white fabric lampshade at right (C) black glossy table at center (D) matte red chair at lower left" }, { "from": "gpt", "value": "(B) white fabric lampshade at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/71095cb61cb5ef29.jpg", "conversations": [ { "from": "human", "value": "\nIs black velvet suit at left below black wool suit at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, black velvet suit at left is positioned under black wool suit at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf242e629078aef1.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) speckled feathered pigeon at lower left (B) black polished stone pillar at center (C) glossy granite water at upper center (D) speckled feathered bird at upper right" }, { "from": "gpt", "value": "(A) speckled feathered pigeon at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d116fdda91d054e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) rusty rock cave at center (B) blue water at center" }, { "from": "gpt", "value": "(B) blue water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4b0a6f3eef8e5321.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.940, 0.609) (B) (0.574, 0.500) (C) (0.307, 0.975) (D) (0.107, 0.463)" }, { "from": "gpt", "value": "(D) (0.107, 0.463)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d475dcccdf00a962.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at center is thinner than green textured tree at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green leafy tree at center has a lesser width compared to green textured tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de203547ddf20c0c.jpg", "conversations": [ { "from": "human", "value": "\nIs brown soil at center to the left of rocky gray mountain at upper center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, brown soil at center is to the right of rocky gray mountain at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/91ca8ecef6c42805.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green smooth water at center is thinner than green leafy tree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, green smooth water at center's width is not less than green leafy tree at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5460b29e553a47b6.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the yellowish paper stack at right? Select from: (A) wooden desk at center (B) white matte arc lamp at center" }, { "from": "gpt", "value": "(A) wooden desk at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e7465509feff80ae.jpg", "conversations": [ { "from": "human", "value": "\nDoes floral dress at center appear over matte pink shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b4eec4033c5c2b5.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) dark brown leather jacket at center (B) transparent water at center (C) white matte boat at right" }, { "from": "gpt", "value": "(A) dark brown leather jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/69116974a494d488.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if suede orange blazer at center is positioned above matte red dress at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, suede orange blazer at center is not positioned above matte red dress at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/792a5a45a5492030.jpg", "conversations": [ { "from": "human", "value": "\nDoes purple fleece jacket at center have a smaller size compared to smooth gray rock at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, purple fleece jacket at center has a smaller size compared to smooth gray rock at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06a400e0ff05bb45.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the gray fabric shoe at lower center? Select from: (A) white fabric sock at lower center (B) leopard print leggings at center (C) white canvas shoe at lower center" }, { "from": "gpt", "value": "(B) leopard print leggings at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2eba9a263076a800.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if beige cotton shirt at right is positioned above white matte projector screen at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, beige cotton shirt at right is not positioned above white matte projector screen at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2a1c861c3c746637.jpg", "conversations": [ { "from": "human", "value": "\nWhere is gray stone path at center located in relation to greenish-blue water at center in the image? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/120116ad430edc03.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.178, 0.352) (B) (0.156, 0.322) (C) (0.257, 0.748)" }, { "from": "gpt", "value": "(C) (0.257, 0.748)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f964ccf047af528a.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the velvet black coat at center? (A) blue denim jacket at lower right (B) gray concrete pavement at lower right" }, { "from": "gpt", "value": "(B) gray concrete pavement at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/80fbf48c72efc61a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) dark gray fabric jacket at left (B) dark blue uniform at center" }, { "from": "gpt", "value": "(B) dark blue uniform at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e6ec2c745a0d8040.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte cookie at left lie behind white frosted biscuit at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/486c936f5b7e3953.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of yellow wooden church at center in reference to striped cotton sweater at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5f77a77c1cfba0fa.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) white cotton shirt at lower left (B) white fabric bag at lower left" }, { "from": "gpt", "value": "(B) white fabric bag at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07db87a1a4810464.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.551, 0.592) (B) (0.434, 0.592)" }, { "from": "gpt", "value": "(A) (0.551, 0.592)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/660bb9be0e5f784c.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black hair at upper center positioned in front of black metallic microphone at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb7b4a22abac744b.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the white satin dress at lower right from the following options: (A) sunglasses at upper right (B) light blue satin dress at lower right?" }, { "from": "gpt", "value": "(A) sunglasses at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88f45617be5137e6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte wood cabin at center is wider than wooden signpost at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte wood cabin at center is wider than wooden signpost at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78ad4d63d53eec70.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the dark gray suit at right from the following options: (A) dark gray jacket at lower left (B) dark brown leather coat at center (C) plaid wool coat at lower right (D) matte black suit at center?" }, { "from": "gpt", "value": "(C) plaid wool coat at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46f27f238c4847ee.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.634, 0.934) (B) (0.811, 0.883) (C) (0.674, 0.539)" }, { "from": "gpt", "value": "(C) (0.674, 0.539)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/47c1b778fba59c1d.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the blue fabric at center? (A) floral fabric shirt at center (B) matte pink blouse at upper left" }, { "from": "gpt", "value": "(A) floral fabric shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e7c7182e2a5696e.jpg", "conversations": [ { "from": "human", "value": "\nIs metallic chain at center thinner than gold shiny shoe at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, metallic chain at center's width is less than gold shiny shoe at lower left's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6781b0d5474c61f2.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.138, 0.586) (B) (0.670, 0.397) (C) (0.838, 0.681)" }, { "from": "gpt", "value": "(C) (0.838, 0.681)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/132471d2a85c4a9e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) light blue denim jeans at center (B) blue fabric jacket at lower left" }, { "from": "gpt", "value": "(A) light blue denim jeans at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a3c441ee0f2fd79.jpg", "conversations": [ { "from": "human", "value": "\nIs brown shingles at center above golden stone bell tower at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, brown shingles at center is not positioned above golden stone bell tower at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ad44de50c16d28a8.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the shiny black crow at upper left? (A) shiny black raven at center (B) brown matte bread at center" }, { "from": "gpt", "value": "(A) shiny black raven at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d7e0079514d60904.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the pink fabric neckband at center? Choose among these: (A) brindle fur bulldog at right (B) striped cotton blanket at center (C) beige fur pug at center" }, { "from": "gpt", "value": "(C) beige fur pug at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9de42dafbf18dbbe.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.803, 0.406) (B) (0.725, 0.539) (C) (0.547, 0.706)" }, { "from": "gpt", "value": "(B) (0.725, 0.539)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/24f633b874a6b047.jpg", "conversations": [ { "from": "human", "value": "\nDoes metal wire fence at upper center appear on the right side of spotted fur cheetah at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, metal wire fence at upper center is not on the right side of spotted fur cheetah at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d143897f2794120.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green glossy duck at center is positioned below shiny green duck at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, green glossy duck at center is located below shiny green duck at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5bac8a97599da128.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) green rubber apron at center (B) black rubber apron at right" }, { "from": "gpt", "value": "(A) green rubber apron at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b6a238c61186e77f.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.050, 0.341) (B) (0.569, 0.269)" }, { "from": "gpt", "value": "(B) (0.569, 0.269)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/64a6b3c3aaee5ea6.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.623, 0.531) (B) (0.620, 0.856) (C) (0.834, 0.698)" }, { "from": "gpt", "value": "(A) (0.623, 0.531)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00ca3f7f8d884140.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white feathered bra at left is positioned below black reflective sunglasses at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, white feathered bra at left is positioned under black reflective sunglasses at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/499302d5aa2b492c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) shiny reflective water at center (B) golden textured clouds at upper center (C) green matte trees at center" }, { "from": "gpt", "value": "(A) shiny reflective water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/57ad75be56dbddb9.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black matte shirt at center is thinner than matte pink blouse at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, black matte shirt at center might be wider than matte pink blouse at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b443fe596e32889.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray matte bird at center have a lesser width compared to pinkish-brown textured beak at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, gray matte bird at center's width is not less than pinkish-brown textured beak at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a09bd223da765167.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of white shredded onion at right in relation to black plastic knife at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/45c6bdc21d69e30d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.101, 0.686) (B) (0.883, 0.637)" }, { "from": "gpt", "value": "(B) (0.883, 0.637)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/76c696116a9bf350.jpg", "conversations": [ { "from": "human", "value": "\nDoes weathered wood hut at center have a greater width compared to yellow plastic dock at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, weathered wood hut at center might be narrower than yellow plastic dock at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f8f5e3d550dca11.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.145, 0.644) (B) (0.683, 0.047) (C) (0.303, 0.759)" }, { "from": "gpt", "value": "(B) (0.683, 0.047)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/93927f3b0311ae84.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black vest at center further to camera compared to neon yellow reflective vest at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, matte black vest at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/32f11e6bbf85f4e2.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) brown furry cow at lower left (B) dark brown fur cow at lower left (C) green grassy hillside at upper center" }, { "from": "gpt", "value": "(C) green grassy hillside at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc31d0c4f01b89f7.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) white striped shirt at left (B) purple wool scarf at center (C) dark gray suit at center" }, { "from": "gpt", "value": "(B) purple wool scarf at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/529a0e0b612e62ec.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is matte yellow shirt at center located relative to light brown wooden chair at center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1065222a8b02328d.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) matte white balloon at center (B) matte red balloon at left" }, { "from": "gpt", "value": "(A) matte white balloon at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e4fa9b312f0e1f1d.jpg", "conversations": [ { "from": "human", "value": "\nIs white shirt at center bigger than green fabric flag at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/96e9e726121e7bd5.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if beige fabric curtain at left is positioned below black matte shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, beige fabric curtain at left is not positioned below black matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba0eccd67576ed84.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray matte t-shirt at center appear on the left side of brown matte sunglasses at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, gray matte t-shirt at center is positioned on the left side of brown matte sunglasses at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e77f0220284626ea.jpg", "conversations": [ { "from": "human", "value": "\nIs black ink sketch of face at center positioned at the back of smooth black face at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0cb47b449b86e1f9.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of shiny black suit at center in relation to black matte camera at lower left? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b8f6bd23c22e0056.jpg", "conversations": [ { "from": "human", "value": "\nIs clear water at lower center positioned in front of gray metallic ship at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, clear water at lower center is in front of gray metallic ship at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c64e990c4d321097.jpg", "conversations": [ { "from": "human", "value": "\nIs gray cotton shirt at center positioned at the back of white plastic computer desk at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is in front of white plastic computer desk at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c33117b2b52fd214.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of red matte shirt at center in relation to yellow fabric shirt at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/285ed77705189a51.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.648, 0.556) (B) (0.481, 0.348) (C) (0.404, 0.412) (D) (0.258, 0.584)" }, { "from": "gpt", "value": "(A) (0.648, 0.556)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aa9bd3b09cd59a95.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) translucent glass beer at lower left (B) striped cotton shirt at center" }, { "from": "gpt", "value": "(A) translucent glass beer at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b22856b7f418dbd.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark suit at center have a smaller size compared to maroon textured tie at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, dark suit at center might be larger than maroon textured tie at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fedf6b560a30ab41.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy plant at lower left is positioned below glossy red berry at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, green leafy plant at lower left is below glossy red berry at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8808b5f19f82b31f.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of green leafy tree at center in relation to green grass at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/181dbad0d1fb2c6e.jpg", "conversations": [ { "from": "human", "value": "\nDoes light blue cotton shirt at center have a smaller size compared to blonde curly hair at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, light blue cotton shirt at center has a smaller size compared to blonde curly hair at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ce18b09ef64f1d5.jpg", "conversations": [ { "from": "human", "value": "\nDoes brushed metal mountain at center appear on the left side of silver metallic trailer at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, brushed metal mountain at center is to the left of silver metallic trailer at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/71e635d575644478.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.116, 0.764) (B) (0.561, 0.688)" }, { "from": "gpt", "value": "(A) (0.116, 0.764)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c5258f8a96416646.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden bay window at center below white matte totoro at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, wooden bay window at center is above white matte totoro at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/54f748082a1f884b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white floral shirt at center is thinner than green leafy lei at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, white floral shirt at center's width is less than green leafy lei at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/493b79f04f570972.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the white cotton shirt at center? (A) pink striped polo shirt at center (B) light blue t-shirt at center" }, { "from": "gpt", "value": "(B) light blue t-shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b710e497c7f7d7e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark brown hair at right is positioned to the left of pale skin ear at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, dark brown hair at right is not to the left of pale skin ear at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e56b94af90029584.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the yellow foam ring at center? Choose from: (A) matte black swimsuit at center (B) transparent plastic goggles at upper center" }, { "from": "gpt", "value": "(B) transparent plastic goggles at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e5061183de0b079a.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.202, 0.762) (B) (0.865, 0.770)" }, { "from": "gpt", "value": "(B) (0.865, 0.770)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d8b696963d8f731.jpg", "conversations": [ { "from": "human", "value": "\nIs foggy smoke at upper center wider than shiny reflective water at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, foggy smoke at upper center is wider than shiny reflective water at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/79b7ecc4d56f21f4.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy trees at center is wider than green textured tree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of green leafy trees at center exceeds that of green textured tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f0b74f458b71e9ca.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte pink coat at lower center is positioned below matte pink jacket at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, matte pink coat at lower center is located below matte pink jacket at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/83f5059b6e2c69a2.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if wooden sign at center is positioned above matte glass door at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, wooden sign at center is not above matte glass door at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6bd3b5720be38b37.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at upper left is thinner than black plastic stool at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, green leafy tree at upper left might be wider than black plastic stool at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d912b60fbeb2627.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) shiny gold helmet at right (B) black suit at center" }, { "from": "gpt", "value": "(A) shiny gold helmet at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c9123fbb119ea1c0.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of dark brown backpack at center in relation to dark brown hair at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b4890d949f70d9e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green striped fabric at lower left is wider than white paper tray at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, green striped fabric at lower left might be narrower than white paper tray at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2de4e2ad43729499.jpg", "conversations": [ { "from": "human", "value": "\nWhere is silver metallic van at center-left located in relation to pink fabric bag at center in the image? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d8f3afb9971ac18.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.763, 0.639) (B) (0.975, 0.878)" }, { "from": "gpt", "value": "(B) (0.975, 0.878)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1228ddb1b676d7f3.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the silky red fabric at center? (A) matte floral fabric hand at center (B) smooth skin hand at center" }, { "from": "gpt", "value": "(B) smooth skin hand at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba36544ef08a226c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.440, 0.487) (B) (0.185, 0.802) (C) (0.615, 0.148) (D) (0.894, 0.992)" }, { "from": "gpt", "value": "(B) (0.185, 0.802)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/613b605d6285f98e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.722, 0.991) (B) (0.626, 0.911)" }, { "from": "gpt", "value": "(B) (0.626, 0.911)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9176fce8f6513404.jpg", "conversations": [ { "from": "human", "value": "\nIs blue water at lower center bigger than green leafy tree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, blue water at lower center might be smaller than green leafy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/24e9d38fbbbf8119.jpg", "conversations": [ { "from": "human", "value": "\nDoes snow-covered evergreen at center appear over black matte ski suit at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, snow-covered evergreen at center is located above black matte ski suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d91f6eed05382304.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.866, 0.977) (B) (0.655, 0.953) (C) (0.506, 0.886)" }, { "from": "gpt", "value": "(B) (0.655, 0.953)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df4db6824a5efd72.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) green fleece vest at lower right (B) green leafy palm tree at upper left (C) dark blue jacket at center (D) dark gray sweater at center" }, { "from": "gpt", "value": "(A) green fleece vest at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7a8e3444d45cb060.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) clear glass pond at center (B) green leafy tree at lower left (C) green leafy tree at upper left" }, { "from": "gpt", "value": "(A) clear glass pond at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e213f591439e462.jpg", "conversations": [ { "from": "human", "value": "\nDoes black matte jacket at center have a greater width compared to light beige shirt at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, black matte jacket at center's width does not surpass light beige shirt at left's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4c10c42bad67ea8a.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) green matte shirt at center (B) matte red dress at center" }, { "from": "gpt", "value": "(B) matte red dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3500127294079b87.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark gray jacket at center appear on the right side of light blue denim jeans at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, dark gray jacket at center is to the right of light blue denim jeans at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df2489fc61b4d924.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.230, 0.689) (B) (0.274, 0.702)" }, { "from": "gpt", "value": "(B) (0.274, 0.702)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/09a4078cc6b1a4a2.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) clear glass water at table center (B) black matte shirt at left (C) yellow t-shirt at left" }, { "from": "gpt", "value": "(B) black matte shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c76bebeadeaaf4f.jpg", "conversations": [ { "from": "human", "value": "\nWhere is silhouette fabric at center located in relation to matte blue shirt at center in the image? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d15569b076f1792c.jpg", "conversations": [ { "from": "human", "value": "\nDoes rusty metal building at center have a greater width compared to white metallic excavator at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/50431dfa375fe4a6.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of brown matte pot at center and white fluffy rice at upper right in the image provided, where is brown matte pot at center located with respect to white fluffy rice at upper right? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b8a2d5199f1b4526.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.127, 0.384) (B) (0.594, 0.903)" }, { "from": "gpt", "value": "(B) (0.594, 0.903)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7363caf09d58117.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.303, 0.377) (B) (0.819, 0.398)" }, { "from": "gpt", "value": "(A) (0.303, 0.377)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5329c319a36d3a65.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) black matte octopus at center (B) blue glossy puddle at center" }, { "from": "gpt", "value": "(B) blue glossy puddle at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d789f4eb4de666b7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white paper sign at center is smaller than black wrought iron lamp post at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/84ef800d7086dd64.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) concrete top table at center (B) yellowtextured fabricpillow at center (C) pink gingham pillow at left" }, { "from": "gpt", "value": "(B) yellowtextured fabricpillow at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b623e03ea901c2ed.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of cloudy sky at upper center in relation to matte black car at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6999258eaeb8b0e3.jpg", "conversations": [ { "from": "human", "value": "\nIs white cotton dress at center in front of white matte donkey at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white cotton dress at center is behind white matte donkey at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ea90df6f307d616.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) matte black shirt at left (B) pink checkered jacket at upper left" }, { "from": "gpt", "value": "(B) pink checkered jacket at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7a90f9aae4e18b08.jpg", "conversations": [ { "from": "human", "value": "\nIs blue matte van at center above white matte sign at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, blue matte van at center is below white matte sign at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd6e417a2918938b.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.184, 0.303) (B) (0.266, 0.956)" }, { "from": "gpt", "value": "(A) (0.184, 0.303)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dec166f817c1393d.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the textured fabric shirt at center? (A) blue fabric shirt at center (B) beige stone pillar at center" }, { "from": "gpt", "value": "(B) beige stone pillar at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0771693aede2a7da.jpg", "conversations": [ { "from": "human", "value": "\nIs matte skin at center to the left of tan fabric hat at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, matte skin at center is positioned on the left side of tan fabric hat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5cfbfc47e5354a5a.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is silhouette leafy tree at lower left located relative to gray/cloudy sky at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7bf1b19ff2b051c.jpg", "conversations": [ { "from": "human", "value": "\nWhere is pink fabric cape at center located in relation to green matte coat at center in the image? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b27fe967a20b4d28.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if orange cotton shirt at lower right is positioned above matte gray sweater at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/abea15c2de2c7ec0.jpg", "conversations": [ { "from": "human", "value": "\nIs dark blue striped shirt at center below white matte t-shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, dark blue striped shirt at center is positioned under white matte t-shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3118e0abc6886bb7.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) white plastic kindle at right (B) brown/kraft paper amazonkindle at center" }, { "from": "gpt", "value": "(A) white plastic kindle at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00762e909dd970e9.jpg", "conversations": [ { "from": "human", "value": "\nIs matte yellow wall at left to the left of brown fabric at right from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte yellow wall at left is to the left of brown fabric at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7aefd23c953cd20e.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) blue denim overalls at upper center (B) orange/white striped traffic cone at lower center, is positioned farthest from the white metallic utility truck at lower left?" }, { "from": "gpt", "value": "(A) blue denim overalls at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4cb7de0259e942bf.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.495, 0.355) (B) (0.318, 0.730) (C) (0.041, 0.406) (D) (0.729, 0.519)" }, { "from": "gpt", "value": "(C) (0.041, 0.406)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3ab89a481e2c83ed.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.525, 0.688) (B) (0.564, 0.691)" }, { "from": "gpt", "value": "(B) (0.564, 0.691)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c8844a4857f64298.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the gray cloudy sky at upper center? (A) green forested mountain at center (B) green matte forest at center" }, { "from": "gpt", "value": "(B) green matte forest at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d96eb6bbd6d6f56b.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the green grass at center among (A) white cotton shirt at center (B) black smooth hair at upper left?" }, { "from": "gpt", "value": "(B) black smooth hair at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d8cf1a7f26850cb9.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the light blue uniform at left? (A) matte blue uniform at left (B) gray striped suit at right (C) camouflage uniform at center" }, { "from": "gpt", "value": "(A) matte blue uniform at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6bbf7631a00bddc8.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) white matte shirt at center (B) brown fabric couch at center (C) brown fabric pillow at center" }, { "from": "gpt", "value": "(A) white matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c9d328ecd6199c6.jpg", "conversations": [ { "from": "human", "value": "\nIs clear blue water at center thinner than green matte tree at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6867dad67303d21f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.582, 0.494) (B) (0.664, 0.780)" }, { "from": "gpt", "value": "(B) (0.664, 0.780)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4da01e27fdea492f.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the metallic blue train at center? Select from: (A) light blue jeans at center (B) jeans at left (C) white shirt at left" }, { "from": "gpt", "value": "(B) jeans at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bfcab47b88dadfaa.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green plastic computer at upper right is smaller than white fabric at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, green plastic computer at upper right is smaller than white fabric at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0dd5d8b22aeb6fa2.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) green matte glass jar at center (B) green matte jar at center (C) green matte jar at left" }, { "from": "gpt", "value": "(A) green matte glass jar at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/81263c8cf5acee76.jpg", "conversations": [ { "from": "human", "value": "\nIs metallic brown rhinoceros at center to the right of gray matte rhinoceros at left from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, metallic brown rhinoceros at center is to the left of gray matte rhinoceros at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/94205e74cc733750.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the brown textured sweater at center from the following options: (A) brown leather jacket at center (B) brown textured jacket at center (C) white dotted fabric dress at left (D) brown hair at center?" }, { "from": "gpt", "value": "(C) white dotted fabric dress at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0715fb7241b39e00.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the transparent glass table at lower left? Choose among these: (A) matte black jacket at center (B) plaid wool jacket at center" }, { "from": "gpt", "value": "(A) matte black jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ad74c4bb1703aae.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.020, 0.152) (B) (0.694, 0.575) (C) (0.462, 0.936)" }, { "from": "gpt", "value": "(A) (0.020, 0.152)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/027a5fd16ebb018c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.497, 0.686) (B) (0.774, 0.455) (C) (0.287, 0.728) (D) (0.902, 0.872)" }, { "from": "gpt", "value": "(A) (0.497, 0.686)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a379f376d5f3751e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the gray fabric jacket at center? Choose among these: (A) light gray sweatshirt at upper right (B) checkered fabric shirt at center (C) light brown hair at lower left" }, { "from": "gpt", "value": "(B) checkered fabric shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ec9ccf29f77c44a.jpg", "conversations": [ { "from": "human", "value": "\nWhere is golden fur dog at center located in relation to shiny brown teeth at center in the image? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07edac9e9350ea07.jpg", "conversations": [ { "from": "human", "value": "\nWhere is blue fabric judo gi at center located in relation to blue fabric kimono at center in the image? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/55ef26e400ab32f2.jpg", "conversations": [ { "from": "human", "value": "\nIs brown wooden gazebo at center further to the viewer compared to green matte hedge at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06cc7f78c29b1c10.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of green painted wood at upper center less distant than that of speckled feathered duck at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, green painted wood at upper center is behind speckled feathered duck at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df000ce9c5d95e89.jpg", "conversations": [ { "from": "human", "value": "\nIs matte red train at left below matte orange train at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, matte red train at left is not below matte orange train at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49e92b934904759f.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte blue airplane at center is wider than metallic blue airplane at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ada3737246167bbc.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.030, 0.131) (B) (0.698, 0.044)" }, { "from": "gpt", "value": "(B) (0.698, 0.044)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86871eae69ca61c8.jpg", "conversations": [ { "from": "human", "value": "\nIs dark fabric shirt at right smaller than black matte head at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, dark fabric shirt at right is not smaller than black matte head at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c22c553c071053a7.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.716, 0.522) (B) (0.466, 0.905)" }, { "from": "gpt", "value": "(B) (0.466, 0.905)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/63f49928d806b72f.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the dark glass mug at left from the following options: (A) knitted scarf at upper center (B) white knitted scarf at upper center (C) clear glass water at center?" }, { "from": "gpt", "value": "(A) knitted scarf at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a4d7d653d37213e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.348, 0.833) (B) (0.723, 0.817) (C) (0.346, 0.242) (D) (0.968, 0.759)" }, { "from": "gpt", "value": "(D) (0.968, 0.759)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/927594e5b6d7e1f2.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if shiny red carriage at center is thinner than shiny silver carriage at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, shiny red carriage at center might be wider than shiny silver carriage at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df1aeeb55bbb7aea.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if concrete at center is positioned to the right of white glossy sedan at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, concrete at center is not on the right side of white glossy sedan at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/027ac2696f8daf6e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the blue glossy eye at upper center? Select from: (A) pink fabric shirt at left (B) smooth skin face at center (C) blue glossy eye at center" }, { "from": "gpt", "value": "(A) pink fabric shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd10f9ea1d1aee79.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the yellow glass traffic light at upper center? Select from: (A) white plastic license plate at center (B) shiny silver sedan at center" }, { "from": "gpt", "value": "(A) white plastic license plate at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1339cb00f86a1368.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.828, 0.905) (B) (0.548, 0.839) (C) (0.683, 0.547) (D) (0.295, 0.573)" }, { "from": "gpt", "value": "(A) (0.828, 0.905)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c1a010afbb72c3cf.jpg", "conversations": [ { "from": "human", "value": "\nDoes smooth skin face at center appear under tan leather jacket at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, smooth skin face at center is not below tan leather jacket at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7b1c1f8a9ba2ecc.jpg", "conversations": [ { "from": "human", "value": "\nWhere is matte black jacket at center located in relation to corduroy red jacket at center in the image? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73a19ecdd30c68ff.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of white fabric canopy at upper center in relation to beige fabric jacket at left? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d2b0a5c859562a5.jpg", "conversations": [ { "from": "human", "value": "\nIs translucent glass bottle at upper right to the right of translucent glass bottle at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, translucent glass bottle at upper right is positioned on the right side of translucent glass bottle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec4887240ace195e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.905, 0.378) (B) (0.420, 0.109)" }, { "from": "gpt", "value": "(B) (0.420, 0.109)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/037dc1a85d096ee4.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the green rough bark tree at center from the following options: (A) dry grass at center (B) green-brown bark tree at center?" }, { "from": "gpt", "value": "(B) green-brown bark tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4dc4f774da1f3663.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.848, 0.567) (B) (0.556, 0.477) (C) (0.138, 0.706)" }, { "from": "gpt", "value": "(C) (0.138, 0.706)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc253460d4bc83e1.jpg", "conversations": [ { "from": "human", "value": "\nDoes pink fabric dress at left appear over clear plastic cup at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, pink fabric dress at left is positioned over clear plastic cup at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ffe6ff79df2c16e.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the red marble column at center? (A) green leafy tree at upper center (B) reddish-brown stone column at left (C) smooth terracotta column at center" }, { "from": "gpt", "value": "(A) green leafy tree at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf98eb707b31ba17.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of smooth gray sweater at center less distant than that of matte pink sweater at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, smooth gray sweater at center is in front of matte pink sweater at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78a15379ff4d0c5e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) leather jacket at left (B) matte red jacket at center (C) leather jacket at center" }, { "from": "gpt", "value": "(A) leather jacket at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fcd8d14c586ae1d7.jpg", "conversations": [ { "from": "human", "value": "\nWhere is white cotton shirt at center located in relation to matte black camera at right in the image? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fd3fcdeb6dcf2fa6.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.539, 0.159) (B) (0.213, 0.620) (C) (0.606, 0.780)" }, { "from": "gpt", "value": "(A) (0.539, 0.159)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/66e04a3974d38b1f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) rusty metal cannon at lower center (B) rusty metal cannon at center" }, { "from": "gpt", "value": "(B) rusty metal cannon at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7653fd6797ce246.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the matte brown leather jacket at center? (A) white matte shirt at center (B) light brown leather jacket at center" }, { "from": "gpt", "value": "(B) light brown leather jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd41b7120551af4c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) plaid fabric shirt at center (B) wooden board at right" }, { "from": "gpt", "value": "(A) plaid fabric shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5150e9558cb65388.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.477, 0.634) (B) (0.521, 0.820)" }, { "from": "gpt", "value": "(A) (0.477, 0.634)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8bb3f6e25c93caa.jpg", "conversations": [ { "from": "human", "value": "\nIs dark brown wooden barrel at center wider than denim overalls at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, dark brown wooden barrel at center is wider than denim overalls at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de3a88d26bbf5a8a.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the green glossy tree at upper right? Select from: (A) green forested mountain at upper left (B) gray/rough rock at center" }, { "from": "gpt", "value": "(B) gray/rough rock at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/121a502777bba247.jpg", "conversations": [ { "from": "human", "value": "\nDoes dusty gravel dirt track at lower left lie behind white plastic sign at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf70a9830d7eff5b.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) brown glossy shredded meat at center (B) skinny flesh at lower left" }, { "from": "gpt", "value": "(B) skinny flesh at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/61c3d32f92c87e5c.jpg", "conversations": [ { "from": "human", "value": "\nDoes transparent glass table at lower center appear on the left side of yellow matte chips at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, transparent glass table at lower center is to the left of yellow matte chips at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b7cb2656f858463.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) transparent glass table at center (B) matte black suit at center (C) translucent plastic water bottle at center (D) patterned silk tie at center" }, { "from": "gpt", "value": "(A) transparent glass table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a55dd0e7e093808.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.560, 0.738) (B) (0.749, 0.436)" }, { "from": "gpt", "value": "(A) (0.560, 0.738)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/17afd5e42e4a2f48.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.982, 0.659) (B) (0.279, 0.619) (C) (0.129, 0.300)" }, { "from": "gpt", "value": "(B) (0.279, 0.619)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23e5c861e681d06b.jpg", "conversations": [ { "from": "human", "value": "\nDoes metallic red crane at center have a lesser width compared to metallic gray pole at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, metallic red crane at center is not thinner than metallic gray pole at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3fc76958ac7b03bd.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.441, 0.523) (B) (0.348, 0.680) (C) (0.800, 0.734) (D) (0.163, 0.842)" }, { "from": "gpt", "value": "(D) (0.163, 0.842)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/87d34fa2e3ed4923.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white paper champions tour sign at center is positioned above black matte tripod at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2a83541660cafd6f.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the yellow leafy tree at center from the following options: (A) yellow-green grass at center (B) green matte tree at left (C) golden yellow leaves at center?" }, { "from": "gpt", "value": "(C) golden yellow leaves at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d8669aa397688cb.jpg", "conversations": [ { "from": "human", "value": "\nDoes denim jacket at center have a smaller size compared to faded denim jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, denim jacket at center is not smaller in size than faded denim jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37ec33ace31d48d4.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.121, 0.570) (B) (0.212, 0.467) (C) (0.040, 0.719)" }, { "from": "gpt", "value": "(A) (0.121, 0.570)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f2e50d639860b3e7.jpg", "conversations": [ { "from": "human", "value": "\nIs brick pavement at center behind fluffy brown jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06d6459fa45fa92a.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of white paper at center and white soft beard at left in the image provided, where is white paper at center located with respect to white soft beard at left? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b59aa557aa2ee16.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.148, 0.808) (B) (0.403, 0.450) (C) (0.625, 0.809)" }, { "from": "gpt", "value": "(B) (0.403, 0.450)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2af0144cea1cb73c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the brick church at center? Select from: (A) smooth brown spire at center (B) brick tower at center" }, { "from": "gpt", "value": "(B) brick tower at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f9c7655f1edd115.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if light green striped shirt at center is bigger than white cotton shirt at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, light green striped shirt at center might be smaller than white cotton shirt at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ea826054cef9d27.jpg", "conversations": [ { "from": "human", "value": "\nDoes black matte high-top boot at center appear under black matte shoe at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, black matte high-top boot at center is located below black matte shoe at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/35aea8ba0c5cf3bf.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) rusty wood porch at center (B) rusty wood hut at center" }, { "from": "gpt", "value": "(A) rusty wood porch at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e3ed17d75206b2a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) shiny black car at lower left (B) concrete bridge at upper center" }, { "from": "gpt", "value": "(A) shiny black car at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eacce49f67fdea1b.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte dress at center above floral dress at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, black matte dress at center is above floral dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/13e7f576df04ce45.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.569, 0.294) (B) (0.275, 0.463) (C) (0.621, 0.998)" }, { "from": "gpt", "value": "(A) (0.569, 0.294)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/87ecd1dda899efa9.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of brown matte tree at left in reference to rustic stone hut at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/348ae8f1346d1e75.jpg", "conversations": [ { "from": "human", "value": "\nIs green textured pine tree at center to the left of golden textured moon at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, green textured pine tree at center is not on the left side of golden textured moon at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b30d7148a6249d5.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.308, 0.434) (B) (0.355, 0.275)" }, { "from": "gpt", "value": "(B) (0.355, 0.275)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f6076a6df81daf9.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of striped sweater at left in relation to silver metallic laptop at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b8b5b233ec30b75.jpg", "conversations": [ { "from": "human", "value": "\nDoes pink glossy tongue at center have a smaller size compared to pink glossy tongue at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, pink glossy tongue at center is smaller than pink glossy tongue at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dbd94024370119b9.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.032, 0.430) (B) (0.865, 0.812)" }, { "from": "gpt", "value": "(B) (0.865, 0.812)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/10f942557f7af476.jpg", "conversations": [ { "from": "human", "value": "\nIs black smooth dog at center to the left of tan/khaki shorts at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find black smooth dog at center to the left of tan/khaki shorts at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/088a58e0370a6f10.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of shiny black jacket at center in relation to brown leather bag at right? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a9657a6a9589ff48.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the wooden planter at lower right? Choose among these: (A) wooden at center (B) white metal railing at center" }, { "from": "gpt", "value": "(A) wooden at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd5f9b6166d81c38.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.215, 0.527) (B) (0.321, 0.520) (C) (0.462, 0.548) (D) (0.568, 0.566)" }, { "from": "gpt", "value": "(A) (0.215, 0.527)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8250eb66f9b7af15.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) light brown textured shirt at right (B) white fabric at center (C) blue fabric hair tie at upper left (D) white cloth shirt at center" }, { "from": "gpt", "value": "(A) light brown textured shirt at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1bd45e4d56c041d4.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the white glossy car at right? Select from: (A) matte black suv at left (B) metallic blue truck at center" }, { "from": "gpt", "value": "(B) metallic blue truck at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/607d7f128e8633ca.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white stone tower at left is thinner than white fog at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, white stone tower at left is not thinner than white fog at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/65a66d800f76ecd8.jpg", "conversations": [ { "from": "human", "value": "\nDoes green rough bark tree at center appear under green mossy hut at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d056c45cc2e75c86.jpg", "conversations": [ { "from": "human", "value": "\nIs matte brown hat at upper right positioned at the back of black reflective sunglasses at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is in front of black reflective sunglasses at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1401c9e5f29ce69f.jpg", "conversations": [ { "from": "human", "value": "\nIs orange cotton shirt at center further to camera compared to orange cotton tunic at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d8fedf7d029fa922.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) white glossy ferry at center (B) brown clay houses at upper center" }, { "from": "gpt", "value": "(A) white glossy ferry at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db6db1b7a61e4487.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) white plastic gas sign at left (B) white powdery snow at center" }, { "from": "gpt", "value": "(A) white plastic gas sign at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d39eba9cdf55d85.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of brown fuzzy horse at center in relation to brown shiny horse at center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b74ad181941d116.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is pink smooth pig at center located relative to pink spotted pig at upper center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9130752afcc59f5.jpg", "conversations": [ { "from": "human", "value": "\nDoes pink matte cloud at upper center come behind green leafy tree at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is behind green leafy tree at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b95eb5fcbad2f63.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte t-shirt at left appear under khaki pants at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, white matte t-shirt at left is not below khaki pants at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/887325e58d61ebbe.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) matte paper number at center (B) matte yellow tank top at center (C) matte red tank top at right" }, { "from": "gpt", "value": "(A) matte paper number at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/62e8cc8d3d936b5e.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) translucent plastic cup at center (B) clear glass at left" }, { "from": "gpt", "value": "(A) translucent plastic cup at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9718f05ddc7f3f38.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.765, 0.822) (B) (0.230, 0.653) (C) (0.125, 0.950) (D) (0.198, 0.695)" }, { "from": "gpt", "value": "(C) (0.125, 0.950)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c8c9382241257e87.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the blonde hair at lower right? Select from: (A) striped fabric jacket at center (B) bald head at lower left (C) green fabric flag at upper left (D) matte gray sweater at lower right" }, { "from": "gpt", "value": "(C) green fabric flag at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d30efaa331c0f177.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue glossy paddleboard at center is thinner than matte blue shorts at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9606369a9f3fc6f3.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.180, 0.875) (B) (0.445, 0.567)" }, { "from": "gpt", "value": "(A) (0.180, 0.875)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/edeb62541c54ffc1.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the dark gray fabric pants at lower left among (A) light brown leather jacket at center (B) red plaid shirt at center (C) floral-patterned sweater at center (D) dark gray fabric jacket at lower right?" }, { "from": "gpt", "value": "(D) dark gray fabric jacket at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9cf1d4be56112d1e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.225, 0.552) (B) (0.636, 0.922) (C) (0.594, 0.692) (D) (0.861, 0.678)" }, { "from": "gpt", "value": "(D) (0.861, 0.678)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f961508b536c9e3.jpg", "conversations": [ { "from": "human", "value": "\nIs silver metallic car at center smaller than yellow matte license plate at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, silver metallic car at center is not smaller in size than yellow matte license plate at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/19a32f280222a577.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the matte red electric guitar at left? Choose among these: (A) matte blue electric guitar at right (B) blue glossy electric guitar at center (C) matte black guitar at left" }, { "from": "gpt", "value": "(C) matte black guitar at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/252906cf09433cd1.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) striped shirt at left (B) clear glass bowl at center (C) white cotton shirt at center" }, { "from": "gpt", "value": "(A) striped shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78482d6f8b45ef92.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) green grass field at lower center (B) yellow matte house at right (C) wooden hut at lower left" }, { "from": "gpt", "value": "(A) green grass field at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/571d21c9eb8029f0.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if orange smooth carrots at center is positioned to the left of green leafy at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find orange smooth carrots at center to the left of green leafy at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/47cae27c897329fc.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.577, 0.695) (B) (0.270, 0.406) (C) (0.744, 0.859)" }, { "from": "gpt", "value": "(A) (0.577, 0.695)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1df5766f782858fb.jpg", "conversations": [ { "from": "human", "value": "\nWhere is black matte shirt at center located in relation to dark brown leather jacket at center in the image? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cb5329aa4cf0a8d1.jpg", "conversations": [ { "from": "human", "value": "\nIs matte blue bus at left further to the viewer compared to blue matte bus at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f33cb40ea29f9ff.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.585, 0.677) (B) (0.337, 0.333)" }, { "from": "gpt", "value": "(A) (0.585, 0.677)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bae7e3f2d3d8035c.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of glassy black skyscraper at left in reference to gray glass skyscraper at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/39bfaf8167c1687d.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the gray asphalt road at lower left? Select from: (A) matte black map at right (B) white plastic sign at right" }, { "from": "gpt", "value": "(A) matte black map at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2951543a1ee71725.jpg", "conversations": [ { "from": "human", "value": "\nIs silvery water at center positioned before green textured tree at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f262a0f32114aacf.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the shiny black sedan at center? (A) shiny brown car at center (B) shiny silver sedan at center-left (C) shiny black sedan at center-left" }, { "from": "gpt", "value": "(B) shiny silver sedan at center-left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d505bbd64580c4ee.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of white marble face at center in reference to blue water at lower left? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cb40580d2c0c15eb.jpg", "conversations": [ { "from": "human", "value": "\nIs black fabric stroller at center positioned behind denim jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is in front of denim jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0b8671141cb7e86.jpg", "conversations": [ { "from": "human", "value": "\nIs white smooth bell tower at center below green leafy palm tree at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, white smooth bell tower at center is located below green leafy palm tree at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba336cb249c419d4.jpg", "conversations": [ { "from": "human", "value": "\nDoes clear glass window at center come in front of black granite countertop at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2607ed8fef5c0821.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the gray rough rock at center? (A) green leafy plant at upper center (B) gray rough concrete block at lower left" }, { "from": "gpt", "value": "(A) green leafy plant at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9e2506abafd2ece1.jpg", "conversations": [ { "from": "human", "value": "\nIs black metal gate at center further to camera compared to blue fabric shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, black metal gate at center is behind blue fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/efea5ea33342a1d3.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.912, 0.750) (B) (0.940, 0.666)" }, { "from": "gpt", "value": "(A) (0.912, 0.750)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e48ce3f8542c3d46.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) black button-up shirt at center (B) knitted gray sweater at center (C) green silk scarf at center, is positioned closest to the floral dress at center?" }, { "from": "gpt", "value": "(C) green silk scarf at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77dff1db2d5d34f7.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte gray coat at left appear over black matte dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d11840efdb5f6f00.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green matte christmas tree at left located in relation to matte gold jacket at center in the image? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/501694c9c6f7efca.jpg", "conversations": [ { "from": "human", "value": "\nDoes bare wood tree at left appear on the right side of green grassy field at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, bare wood tree at left is not to the right of green grassy field at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e490911a7d9bb86.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at center further to camera compared to brown stone castle at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07354b523586fa09.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green matte tree at left is thinner than wooden cabin at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, green matte tree at left is thinner than wooden cabin at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b28cfdf59545f220.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) blue denim skirt at right (B) white matte bicycle at center" }, { "from": "gpt", "value": "(A) blue denim skirt at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8a297ee5af1e9e1.jpg", "conversations": [ { "from": "human", "value": "\nIs white snow-covered highway at center below white matte truck at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, white snow-covered highway at center is above white matte truck at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1264982560700b5d.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) gold brocade robe at left (B) shiny red fabric dress at center (C) blue silk robe at center, is positioned closest to the glossy wooden table at center?" }, { "from": "gpt", "value": "(B) shiny red fabric dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36ad7520b2e562e3.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black laptop at upper center is bigger than white paper at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, matte black laptop at upper center is larger in size than white paper at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/300ea59bb4ebff79.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray rock at center appear on the right side of blue clear water at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, gray rock at center is positioned on the right side of blue clear water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0c7e5c12db96fe77.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.144, 0.809) (B) (0.727, 0.211) (C) (0.321, 0.719) (D) (0.771, 0.519)" }, { "from": "gpt", "value": "(B) (0.727, 0.211)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed4544be238379d7.jpg", "conversations": [ { "from": "human", "value": "\nIs glossy lacquer teapot at center below glossy ceramic plate at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, glossy lacquer teapot at center is below glossy ceramic plate at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aa39d8a9806a3242.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of smooth bark log at center and brown wooden cabin at center in the image provided, where is smooth bark log at center located with respect to brown wooden cabin at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d593bd0b5974999b.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) white lace scarf at center (B) white fuzzy coat at upper left (C) black wool coat at right" }, { "from": "gpt", "value": "(A) white lace scarf at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9fc2c5d2a5931bc.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) matte black plate at center (B) green plaid shirt at center" }, { "from": "gpt", "value": "(A) matte black plate at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/38f84c61c72ffa28.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.404, 0.089) (B) (0.392, 0.798) (C) (0.665, 0.466)" }, { "from": "gpt", "value": "(B) (0.392, 0.798)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/090c60e2616d707f.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray rough rock at center appear on the left side of white painted metal lighthouse at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, gray rough rock at center is to the right of white painted metal lighthouse at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/021703c6ef12a604.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the dark blue fabric shirt at center from the following options: (A) metallic wire-rimmed glasses at center (B) matte black glasses at center?" }, { "from": "gpt", "value": "(B) matte black glasses at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fd22d4301fa2e6d9.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) striped sweater at center (B) matte black shirt at left (C) matte black shirt at center, is positioned farthest from the white cotton shirt at lower left?" }, { "from": "gpt", "value": "(C) matte black shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e892ad9220704b7d.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the green leafy at center? (A) green leafy lettuce at lower left (B) orange fabric person at center" }, { "from": "gpt", "value": "(B) orange fabric person at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9929ab181bbda91.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black hijab at left lie in front of dark blue fur at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, matte black hijab at left is in front of dark blue fur at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7d86b7c39f1c3b5.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte shirt at center positioned behind wooden table at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, black matte shirt at center is behind wooden table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e7186799bd1e04e.jpg", "conversations": [ { "from": "human", "value": "\nIs weathered wood at center in front of rusty wood log at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, weathered wood at center is in front of rusty wood log at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6cbfb701ff7a94f.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the white glossy projection screen at upper center? (A) green matte/blackboard at left (B) gray woolen sweater at center" }, { "from": "gpt", "value": "(A) green matte/blackboard at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/10c6e8b99ef0f192.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.123, 0.325) (B) (0.058, 0.281)" }, { "from": "gpt", "value": "(A) (0.123, 0.325)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/74cf953f52cf4ec8.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) yellow metallic ski at center (B) brushed metal ski pole at left (C) brown wooden log cabin at center" }, { "from": "gpt", "value": "(B) brushed metal ski pole at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e8b3a5948cffaf8.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) glossy black car at center (B) glossy black sports car at center (C) dark wood entertainment center at lower center" }, { "from": "gpt", "value": "(B) glossy black sports car at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/874bb789346a68e7.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the white smooth shirt at right? Choose among these: (A) yellow matte rice at lower right (B) white plastic bowl at lower center (C) gray checkered shirt at center" }, { "from": "gpt", "value": "(C) gray checkered shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73f9b9f08adbc75e.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the wooden bench at right? (A) brown wooden table at center (B) wooden bench at center (C) black chalkboard at upper center (D) wooden at left" }, { "from": "gpt", "value": "(C) black chalkboard at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1217948a38cd2bf.jpg", "conversations": [ { "from": "human", "value": "\nIs brown branches at upper left above transparent plastic kite at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, brown branches at upper left is above transparent plastic kite at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4a7488453a5ab8b.jpg", "conversations": [ { "from": "human", "value": "\nIs black velvet vest at center smaller than blue cotton shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3520fa0bb4bc11ae.jpg", "conversations": [ { "from": "human", "value": "\nIs white glossy water at center wider than tan fabric jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8fe2574d8f51cf7c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) shiny brown spotted lizard at lower right (B) rough textured rock at upper center" }, { "from": "gpt", "value": "(A) shiny brown spotted lizard at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c3c05d7f82624286.jpg", "conversations": [ { "from": "human", "value": "\nIs green matte map at center bigger than blue fabric shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green matte map at center has a larger size compared to blue fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/322689368d589496.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.533, 0.498) (B) (0.747, 0.875)" }, { "from": "gpt", "value": "(B) (0.747, 0.875)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a1056f370521a06b.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the matte gray minivan at center among (A) white cotton dress at center (B) yellow cotton tank top at left (C) white foam surfboard at center (D) blue fabric shorts at center?" }, { "from": "gpt", "value": "(B) yellow cotton tank top at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d4490b6f2dff573a.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the shiny red apples at center? Select from: (A) white matte lab coat at center (B) smooth green apples at upper center" }, { "from": "gpt", "value": "(A) white matte lab coat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3ed04b6c3a703aaa.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) green matte tree at center (B) white matte snow at center" }, { "from": "gpt", "value": "(B) white matte snow at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/732c4e279090d622.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the gray concrete path at center? Choose among these: (A) green leafy tree at center (B) yellowmaterial/texturesign at lower right" }, { "from": "gpt", "value": "(B) yellowmaterial/texturesign at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e18cd1cebc5aa2a8.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.365, 0.889) (B) (0.346, 0.895)" }, { "from": "gpt", "value": "(A) (0.365, 0.889)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/adc0b7d5f14959af.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) light brown fabric shirt at center (B) dark green fabric shirt at center (C) green painted wood cart at center (D) white matte shirt at center" }, { "from": "gpt", "value": "(D) white matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d6590b7f9a3d9df.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the paper calendar at upper center? (A) black fabric stethoscope at center (B) metallic silver stethoscope at center" }, { "from": "gpt", "value": "(B) metallic silver stethoscope at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e85b0b1094e09e40.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black cotton t-shirt at center is thinner than light gray wool coat at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, black cotton t-shirt at center is not thinner than light gray wool coat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3e013f3922888277.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white smooth building at left is positioned above glassy steel skyscraper at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white smooth building at left is not above glassy steel skyscraper at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/09b6337f92ad4347.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte cream refrigerator at right appear over white matte shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, matte cream refrigerator at right is located above white matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fffe519ee3cddd18.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.309, 0.780) (B) (0.566, 0.231)" }, { "from": "gpt", "value": "(A) (0.309, 0.780)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b492a1c6e970972a.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.946, 0.131) (B) (0.578, 0.509) (C) (0.672, 0.786)" }, { "from": "gpt", "value": "(C) (0.672, 0.786)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7a9c4e75c1aa9a9b.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) brown wood pergola at center (B) blue smooth water at center" }, { "from": "gpt", "value": "(A) brown wood pergola at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6a12610d50677cec.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black jacket at center is positioned below matte white blazer at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, matte black jacket at center is below matte white blazer at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e10be4e4138b512.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is dull gray concrete path at center located relative to stone archway at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e92383ce180ae65.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.175, 0.298) (B) (0.893, 0.898)" }, { "from": "gpt", "value": "(B) (0.893, 0.898)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be71065908302c8b.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) brown/dried leaves at right (B) brown textured tree at center" }, { "from": "gpt", "value": "(A) brown/dried leaves at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7dd0d66e96c2984e.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) brown wooden steps at right (B) brown matte water at lower center" }, { "from": "gpt", "value": "(B) brown matte water at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/318bfabdf7458ab5.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) matte cream dress at center (B) white cotton shirt at center (C) white lace dress at lower left" }, { "from": "gpt", "value": "(C) white lace dress at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c8b70fb46fe5cb4.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) matte black chair at center (B) white blinds at right" }, { "from": "gpt", "value": "(A) matte black chair at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a8213e774390f4f.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown dry leaves at center is positioned to the left of green leafy tree at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, brown dry leaves at center is not to the left of green leafy tree at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ae7abbcf6077f25d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.658, 0.931) (B) (0.626, 0.831)" }, { "from": "gpt", "value": "(A) (0.658, 0.931)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be03078a795b436a.jpg", "conversations": [ { "from": "human", "value": "\nIs blue water at center bigger than smooth pebbles at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, blue water at center is bigger than smooth pebbles at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d98efa1ef5bcd948.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the orange plastic barricade at right among (A) orange mesh fence at left (B) smooth asphalt road at center?" }, { "from": "gpt", "value": "(B) smooth asphalt road at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c0b1bc9ff03de8af.jpg", "conversations": [ { "from": "human", "value": "\nIs gold brocade robe at center bigger than gold lacquered statue at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, gold brocade robe at center is bigger than gold lacquered statue at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9db5a9ed91c19c9f.jpg", "conversations": [ { "from": "human", "value": "\nDoes black cotton t-shirt at right appear on the left side of matte brown backpack at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, black cotton t-shirt at right is not on the left side of matte brown backpack at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/56968398674588ea.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.786, 0.486) (B) (0.252, 0.536) (C) (0.109, 0.572)" }, { "from": "gpt", "value": "(B) (0.252, 0.536)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc51c6ba53789238.jpg", "conversations": [ { "from": "human", "value": "\nIs matte blue leather jacket at left positioned before matte black microphone at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/246df8c40d0c6f53.jpg", "conversations": [ { "from": "human", "value": "\nDoes white striped shirt at center appear on the left side of purple fabric dress at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, white striped shirt at center is positioned on the left side of purple fabric dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6378d71c9e163e73.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the blue fabric shirt at upper center among (A) shiny red motorcycle at center (B) matte blue shirt at center?" }, { "from": "gpt", "value": "(B) matte blue shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd7d41a796b40d56.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black jacket at center lie in front of dark blue shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c9a7c256f18ddb44.jpg", "conversations": [ { "from": "human", "value": "\nIs white fluffy snow at center below white matte car at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c90f997232732325.jpg", "conversations": [ { "from": "human", "value": "\nIs clear blue water at center to the right of dark brown hair at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find clear blue water at center to the right of dark brown hair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf7759e55d3a3338.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.795, 0.891) (B) (0.168, 0.286) (C) (0.001, 0.477) (D) (0.407, 0.322)" }, { "from": "gpt", "value": "(D) (0.407, 0.322)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9bd2c505cfa8f73e.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the white shirt at center? (A) blue plaid shirt at left (B) light blue sweatshirt at center (C) black matte sweatshirt at center" }, { "from": "gpt", "value": "(B) light blue sweatshirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d3156814bd8f3fd.jpg", "conversations": [ { "from": "human", "value": "\nWhere is black asphalt runway at center located in relation to black matte pedestrian signal at left in the image? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ee82c841cd610287.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if floral fabric dress at center is positioned above pink cotton shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, floral fabric dress at center is below pink cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b3853a756c1ef5b.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the matte purple shirt at center? (A) green matte shirt at center (B) wooden park bench at center" }, { "from": "gpt", "value": "(B) wooden park bench at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/89e97d5659b1f235.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.701, 0.459) (B) (0.753, 0.434)" }, { "from": "gpt", "value": "(B) (0.753, 0.434)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/40b6dc80c4fef745.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark wood drawer at lower center lie in front of white matte mug at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c3d2e57f4820523.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) blue striped shirt at lower center (B) light gray cotton t-shirt at left (C) printed silk dress at right" }, { "from": "gpt", "value": "(A) blue striped shirt at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9a612fda69a88b83.jpg", "conversations": [ { "from": "human", "value": "\nIs blue fabric vest at center positioned in front of matte blue vest at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is behind matte blue vest at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58335a1de2a5bd85.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray concrete wall at lower right appear over gray concrete pavement at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, gray concrete wall at lower right is above gray concrete pavement at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c2374a1cd9c07fb4.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black leather jacket at lower left is positioned above gold textured clock at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1dcaace88b738ef.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the white striped shirt at center among (A) black plastic microphone at center (B) matte plastic map at upper center?" }, { "from": "gpt", "value": "(B) matte plastic map at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e2e8746f6435a046.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte brown dress at left have a greater width compared to matte beige blazer at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, matte brown dress at left has a greater width compared to matte beige blazer at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/67c110dd9d6d2451.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.751, 0.673) (B) (0.525, 0.855)" }, { "from": "gpt", "value": "(B) (0.525, 0.855)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b394e1e5c6dc484f.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of pink shirt at left in relation to black foam microphone at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e4bd837acc5a017e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) white smooth tarmac at center (B) white matte airplane at center" }, { "from": "gpt", "value": "(A) white smooth tarmac at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ded67f69b366e24b.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at upper center appear on the left side of rusty metal train car at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green leafy tree at upper center is positioned on the left side of rusty metal train car at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/83b021f6a06b6356.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.399, 0.219) (B) (0.315, 0.217) (C) (0.415, 0.702)" }, { "from": "gpt", "value": "(C) (0.415, 0.702)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/818cf4d41f40849a.jpg", "conversations": [ { "from": "human", "value": "\nIs blue striped tie at center positioned before black plastic microphone at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/10f2e66b8439a9da.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) white checkered tablecloth at center (B) checkered fabric shirt at center (C) dark green sweater at center (D) matte gray shirt at center" }, { "from": "gpt", "value": "(C) dark green sweater at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08b0f9cda23c41e2.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green matte tree at left is smaller than green matte tree at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7bdf3f13bccd4986.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue matte shirt at center appear on the left side of black matte hoodie at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, blue matte shirt at center is to the left of black matte hoodie at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef37c5ac44d7656c.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of white matte shirt at lower right less distant than that of matte black camera at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/39301f9ebdf84ca7.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden acoustic guitar at center smaller than black matte helmet at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, wooden acoustic guitar at center might be larger than black matte helmet at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/234308079624e950.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the black matte leotard at center among (A) matte black shorts at left (B) pink matte leotard at center (C) blue matte tank top at center (D) blue matte leotard at center?" }, { "from": "gpt", "value": "(A) matte black shorts at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a83d603df2bb43d7.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the matte black hatchback at left from the following options: (A) tan metallic car at center (B) yellow plastic license plate at center?" }, { "from": "gpt", "value": "(A) tan metallic car at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8382f127113e2050.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.252, 0.720) (B) (0.555, 0.912)" }, { "from": "gpt", "value": "(A) (0.252, 0.720)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab7bbfb85443657d.jpg", "conversations": [ { "from": "human", "value": "\nIs white plastic chair at lower right above white fabric chair at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white plastic chair at lower right is not above white fabric chair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/79b894d01f1fbc18.jpg", "conversations": [ { "from": "human", "value": "\nIs silver metallic bicycle at left further to camera compared to purple matte helmet at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ef39b1a30bd7705.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.455, 0.527) (B) (0.755, 0.408)" }, { "from": "gpt", "value": "(B) (0.755, 0.408)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46a3a8d3a1f5d037.jpg", "conversations": [ { "from": "human", "value": "\nIs brushed metal trailer truck at lower left closer to the viewer compared to blurred white helmet at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/30254a5f10ffbe53.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) hi-visibility fabric safety vest at center (B) orange reflective vest at center (C) orange reflective safety vest at center (D) high visibility vest at center" }, { "from": "gpt", "value": "(C) orange reflective safety vest at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f2d8647faf282c6b.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) black plastic pole at center (B) green leafy tree at upper center" }, { "from": "gpt", "value": "(A) black plastic pole at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1319ebb366828892.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of matte peach shirt at left in reference to white satin dress at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e81d79bb796a2db.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black penguin at center thinner than white matte penguin at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, matte black penguin at center is not thinner than white matte penguin at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/40a4fadb77c8f874.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of green leafy tree at center more distant than that of sleek silver logo at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, green leafy tree at center is in front of sleek silver logo at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/51e31bd250f26d4d.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) pleated satin dress at center (B) matte black cowboy hat at upper right" }, { "from": "gpt", "value": "(B) matte black cowboy hat at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/810cb2a254df7f08.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) blue matte laptop at center (B) matte white shirt at left (C) floral fabric headscarf at right" }, { "from": "gpt", "value": "(A) blue matte laptop at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4fa7472a20439de1.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the thick green foliage at center from the following options: (A) thick green foliage at right (B) rugged rock canyon at center (C) dark green textured tree at right?" }, { "from": "gpt", "value": "(B) rugged rock canyon at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/063812ed1cfcb7ed.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) black metallic microphone at left (B) black matte suit at lower right (C) yellow striped tie at left (D) silver metallic microphone at upper left, is positioned closest to the black matte suit at center?" }, { "from": "gpt", "value": "(B) black matte suit at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aeae2d09bdad3bcc.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white cotton polo shirt at center is positioned above transparent plastic umbrella at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/84639e792049e551.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) leather vest at center (B) graywool-likebeard at left" }, { "from": "gpt", "value": "(B) graywool-likebeard at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d261e474662869d2.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.754, 0.667) (B) (0.280, 0.728) (C) (0.578, 0.444)" }, { "from": "gpt", "value": "(B) (0.280, 0.728)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a6e74e5f8f28f2de.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is black matte shirt at center located relative to orange fabric dress at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29654554e8968e73.jpg", "conversations": [ { "from": "human", "value": "\nIs checkered fabric shirt at right to the left of matte black suit at left from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, checkered fabric shirt at right is not to the left of matte black suit at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca7e4bc28c29788f.jpg", "conversations": [ { "from": "human", "value": "\nDoes concrete at center have a lesser width compared to gray fabric jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, concrete at center is thinner than gray fabric jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/13a804a8c9f1ce71.jpg", "conversations": [ { "from": "human", "value": "\nDoes blonde hair at center have a larger size compared to blonde hair at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, blonde hair at center is bigger than blonde hair at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d276b7bc75bb3009.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) golden fur dog at center (B) brown furry dog at upper right (C) wire mesh fence at center" }, { "from": "gpt", "value": "(A) golden fur dog at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/beaa6297f4ab60df.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.283, 0.742) (B) (0.617, 0.633)" }, { "from": "gpt", "value": "(A) (0.283, 0.742)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d137a245e9da445.jpg", "conversations": [ { "from": "human", "value": "\nIs striped knit hat at center above matte red sweater at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, striped knit hat at center is positioned over matte red sweater at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/719e9a5bae548fa9.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is smooth concrete train track at center located relative to metallic pole at left? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/499b0e126b3cecbd.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) white metal balcony at center (B) black rubber traffic cone at lower left (C) smooth stone column at center" }, { "from": "gpt", "value": "(A) white metal balcony at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58fe80868fb78f32.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) metallic gray microphone at upper left (B) pink lace dress at lower left (C) pink striped shirt at center (D) black plastic microphone at upper center" }, { "from": "gpt", "value": "(B) pink lace dress at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c6bd58d7d6c59cfd.jpg", "conversations": [ { "from": "human", "value": "\nDoes denim jacket at left appear over brushed metal jacket at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, denim jacket at left is above brushed metal jacket at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3dfcc5c67c641cc9.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the black matte dress at center? Select from: (A) white knitted sweater at left (B) pink matte jacket at center (C) patterned fabric blouse at center (D) black wool coat at center" }, { "from": "gpt", "value": "(B) pink matte jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/67b88d22d2710b80.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the black leather jacket at center from the following options: (A) dark gray asphalt parking lot at lower right (B) shiny blue car at lower right?" }, { "from": "gpt", "value": "(B) shiny blue car at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ec161f8d4766302.jpg", "conversations": [ { "from": "human", "value": "\nIs brown/dry wood tree at right to the right of weathered wood barn at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, brown/dry wood tree at right is positioned on the right side of weathered wood barn at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e02a9eb913c95e8.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the red brick clock tower at center? Choose from: (A) red brick church at center (B) matte red clock at center (C) glassy reflective skyscraper at right" }, { "from": "gpt", "value": "(C) glassy reflective skyscraper at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c0a33c14603c2540.jpg", "conversations": [ { "from": "human", "value": "\nIs brown feathered goose at lower left positioned before brown feathered goose at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is in front of brown feathered goose at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f50c355e0f3d1bfe.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if smooth rock stream at center is smaller than green mossy tree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, smooth rock stream at center occupies less space than green mossy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/65d45f73bc7b6dd9.jpg", "conversations": [ { "from": "human", "value": "\nIs white fluffy goat at lower right smaller than light brown cotton shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/817905ed1940bf43.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is red matte jet ski at center located relative to white glossy sailboat at upper right? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/933b09b391517d49.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.542, 0.702) (B) (0.463, 0.309)" }, { "from": "gpt", "value": "(B) (0.463, 0.309)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/883019f4c4a97caa.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) camouflage fabric uniform at left (B) blue fleece jacket at right, is positioned farthest from the digital camouflage uniform at center?" }, { "from": "gpt", "value": "(A) camouflage fabric uniform at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06010a51d24998e9.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) dark brown leather jacket at lower left (B) blue fabric harness at center" }, { "from": "gpt", "value": "(A) dark brown leather jacket at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f107226a0dc5b4dd.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) green plastic boat at upper left (B) black matte snorkeling gear at lower left, is positioned closest to the red life vest at lower right?" }, { "from": "gpt", "value": "(B) black matte snorkeling gear at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03c310a40df617bc.jpg", "conversations": [ { "from": "human", "value": "\nDoes orange shirt at center have a greater width compared to dark brown shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, orange shirt at center has a greater width compared to dark brown shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/611a3fff427bbe70.jpg", "conversations": [ { "from": "human", "value": "\nIs blue denim jeans at center to the right of light brown fabric dress at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, blue denim jeans at center is positioned on the right side of light brown fabric dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/006141259fecc5b0.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the white cotton shirt at lower left? (A) floral fabric dress at lower left (B) white matte tank top at center" }, { "from": "gpt", "value": "(A) floral fabric dress at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5ba439f2b5edb425.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the smooth suit jacket at upper right? Select from: (A) matte black coat at center (B) smooth leather hand at center" }, { "from": "gpt", "value": "(A) matte black coat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7b52f3000319a47.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of green grass at center in relation to green plastic sign at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b87c55fdfc54988.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of white fur-covered stool at center in relation to white leather stool at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2d0a73b6fd181fe.jpg", "conversations": [ { "from": "human", "value": "\nDoes metallic gold costume at center appear over matte red shirt at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, metallic gold costume at center is positioned over matte red shirt at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a284bdc74e4db06b.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.348, 0.698) (B) (0.078, 0.820) (C) (0.607, 0.570)" }, { "from": "gpt", "value": "(A) (0.348, 0.698)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ded88613feb06552.jpg", "conversations": [ { "from": "human", "value": "\nIs blue matte boat at center wider than blue glossy water at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, blue matte boat at center is wider than blue glossy water at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f544a86c2607a4c7.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.197, 0.819) (B) (0.784, 0.305) (C) (0.203, 0.022)" }, { "from": "gpt", "value": "(C) (0.203, 0.022)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5209e69063d87efd.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the matte blue shirt at center? Choose from: (A) dark blue sweater at center (B) black leather chair at left (C) denim jeans at lower right (D) matte black laptop at left" }, { "from": "gpt", "value": "(D) matte black laptop at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c83be4e92a413666.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if beige fabric jacket at center is positioned to the right of yellow rubber microphone at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, beige fabric jacket at center is to the right of yellow rubber microphone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f7a23947cdb5fb4.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the yellow cotton polo shirt at center? Choose among these: (A) black plastic sunglasses at center (B) gray matte shirt at center" }, { "from": "gpt", "value": "(A) black plastic sunglasses at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf6b05d6841223bb.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if wooden stool at center is positioned below smooth suit at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, wooden stool at center is located below smooth suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4bc363229817e925.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark brown hair at center have a larger size compared to brown hair at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, dark brown hair at center is larger in size than brown hair at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/caedcde1f0fd8d38.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue fleece sweatshirt at center have a smaller size compared to shiny sequined costume at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, blue fleece sweatshirt at center is smaller than shiny sequined costume at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dfbf21c2484ffc09.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue denim jeans at center is thinner than blue fleece jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, blue denim jeans at center might be wider than blue fleece jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77b2971016c817a6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if metallic brass teapot at left is positioned below gold metallic teapot at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f3ca9eeb3788ca0f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) yellow matte building at right (B) matte pink building at center (C) smooth water at center" }, { "from": "gpt", "value": "(C) smooth water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf3b85fee8fe40c2.jpg", "conversations": [ { "from": "human", "value": "\nDoes green mossy stream at center have a lesser width compared to gray rough rock at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, green mossy stream at center is not thinner than gray rough rock at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/33890a4be5873181.jpg", "conversations": [ { "from": "human", "value": "\nDoes striped sweater at center appear over yellow-green fabric jacket at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, striped sweater at center is positioned over yellow-green fabric jacket at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a6af3c45f5b5a0e6.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the matte gold shirt at center from the following options: (A) gold shiny sedan at center (B) gold metallic sedan at center (C) matte gold car at center?" }, { "from": "gpt", "value": "(B) gold metallic sedan at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c1537f8bcfd9908.jpg", "conversations": [ { "from": "human", "value": "\nIs dark clothing crowd at center bigger than smooth stone column at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, dark clothing crowd at center might be smaller than smooth stone column at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/28e72dc2a3bea7a9.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green leafy tree at center located in relation to green matte tree at left in the image? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1746914c3a74bbd9.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) white glossy cherub at center right (B) matte gray petals at left" }, { "from": "gpt", "value": "(A) white glossy cherub at center right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f0e6a198a8c0aff.jpg", "conversations": [ { "from": "human", "value": "\nDoes white plastic machine at center have a larger size compared to matte plastic monitor at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, white plastic machine at center is bigger than matte plastic monitor at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/71ef1ab630ef6fad.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of green fleece jacket at center in relation to green fabric crowd at left? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c3e92d5c945b08d.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the autumn leaves at upper center among (A) purple matte jacket at center (B) purple fabric backpack at center (C) blue fabric backpack at center (D) matte black backpack at lower left?" }, { "from": "gpt", "value": "(A) purple matte jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e3fb2a515f1957f.jpg", "conversations": [ { "from": "human", "value": "\nDoes transparent nylon sock at lower center appear on the left side of matte red shoe at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find transparent nylon sock at lower center to the left of matte red shoe at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/66799faa1b711830.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.624, 0.233) (B) (0.703, 0.512)" }, { "from": "gpt", "value": "(A) (0.624, 0.233)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/088864a96a4aa964.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the clear glass window at left among (A) green matte windshield at lower left (B) teal glossy car at left?" }, { "from": "gpt", "value": "(A) green matte windshield at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b53a7c18a6ee55b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if cloudy sky at upper center is positioned to the left of dark gray rocky mountains at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, cloudy sky at upper center is not on the left side of dark gray rocky mountains at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d2e023317e69e5af.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) yellow satin dress at lower right (B) white t-shirt with graphic at center (C) reddish-orange denim jeans at center (D) dark green uniform at center" }, { "from": "gpt", "value": "(C) reddish-orange denim jeans at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/120a6abb11935110.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) transparent plastic bottle at lower center (B) matte black jacket at left (C) translucent plastic bottle at left" }, { "from": "gpt", "value": "(A) transparent plastic bottle at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/638d336fc413cdf5.jpg", "conversations": [ { "from": "human", "value": "\nDoes smooth black hair at upper center have a lesser width compared to smooth scarf at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be6d589a99d5673b.jpg", "conversations": [ { "from": "human", "value": "\nIs matte brown shirt at center wider than striped cotton sweater at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7089429cdddbe5e9.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the brown stone creek at lower left? Choose among these: (A) green leafy hillside at upper left (B) brown wooden hut at center (C) wooden hut at center" }, { "from": "gpt", "value": "(C) wooden hut at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7c988cdde27cd5c8.jpg", "conversations": [ { "from": "human", "value": "\nIs dark brown meat at lower left thinner than satin silver sink at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, dark brown meat at lower left is thinner than satin silver sink at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/91b538f5b130d235.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.658, 0.650) (B) (0.445, 0.658)" }, { "from": "gpt", "value": "(B) (0.445, 0.658)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/53a0a598e98f4ec3.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.305, 0.533) (B) (0.145, 0.636) (C) (0.709, 0.319)" }, { "from": "gpt", "value": "(B) (0.145, 0.636)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ffb40babaaa66ab.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.227, 0.556) (B) (0.572, 0.866)" }, { "from": "gpt", "value": "(B) (0.572, 0.866)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8fef092ccc0e7af6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if carved stone column at center is smaller than pink fabric jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, carved stone column at center is not smaller in size than pink fabric jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/349a54530211cbf8.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.981, 0.717) (B) (0.447, 0.506)" }, { "from": "gpt", "value": "(A) (0.981, 0.717)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d216031864a0dcb5.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray cotton t-shirt at center appear under shiny red train at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, gray cotton t-shirt at center is above shiny red train at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/360c220796fd23dc.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) white matte soccer uniform at left (B) white net at center (C) blue jersey at center (D) white matte soccer uniform at center" }, { "from": "gpt", "value": "(B) white net at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c41caf8238a1f396.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.365, 0.611) (B) (0.796, 0.703)" }, { "from": "gpt", "value": "(A) (0.365, 0.611)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/707fcc34e42586f4.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.536, 0.869) (B) (0.577, 0.998)" }, { "from": "gpt", "value": "(B) (0.577, 0.998)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cbfaf1ab7987cfae.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.271, 0.037) (B) (0.638, 0.625) (C) (0.238, 0.445) (D) (0.340, 0.436)" }, { "from": "gpt", "value": "(A) (0.271, 0.037)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb6a3e5c0b9b568b.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) rocky gray mountain at center (B) green leafy tree at center (C) green leafy tree at left (D) green glossy tree at center" }, { "from": "gpt", "value": "(D) green glossy tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2161eb98c4b25796.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.419, 0.455) (B) (0.315, 0.227) (C) (0.144, 0.583) (D) (0.165, 0.756)" }, { "from": "gpt", "value": "(B) (0.315, 0.227)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f05648a7e920c283.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of brown cotton t-shirt at center in reference to black hoodie at center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4cf439d71969bf08.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black plastic scissors at left is smaller than yellow matte tennis ball at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ae2cebfbf3af1fd5.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) soft green knit sweater at center (B) smooth black shirt at center" }, { "from": "gpt", "value": "(A) soft green knit sweater at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/24ceacd6e38e7986.jpg", "conversations": [ { "from": "human", "value": "\nIs silhouette bare tree at lower right to the left of green leafy tree at lower center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, silhouette bare tree at lower right is to the right of green leafy tree at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/641a68c032cda7d3.jpg", "conversations": [ { "from": "human", "value": "\nIs black henna tattoo at upper right bigger than white curly hair at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, black henna tattoo at upper right has a larger size compared to white curly hair at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d00b6b9a41050eb2.jpg", "conversations": [ { "from": "human", "value": "\nIs green matte tree at center closer to camera compared to white powdery snow at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/898f6d6c6838c242.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) silver metallic truck at center (B) silver metallic trailer at center (C) metallic silver truck at lower right" }, { "from": "gpt", "value": "(B) silver metallic trailer at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e09a4d47becb39d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.305, 0.839) (B) (0.446, 0.675) (C) (0.345, 0.456) (D) (0.043, 0.723)" }, { "from": "gpt", "value": "(C) (0.345, 0.456)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d9778a3bcdb687b.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) green leafy tree at left (B) green leafy palm tree at upper center (C) green leafy tree at center" }, { "from": "gpt", "value": "(A) green leafy tree at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8871183fdc6bd803.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.145, 0.736) (B) (0.881, 0.823) (C) (0.389, 0.658)" }, { "from": "gpt", "value": "(A) (0.145, 0.736)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea98bebae9b949c7.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) blue matte shirt at center (B) orange backpack at left (C) striped fabric jacket at center" }, { "from": "gpt", "value": "(B) orange backpack at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c6d8fc784223194.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if smooth water at center is positioned below silhouette wooden boat at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, smooth water at center is not below silhouette wooden boat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d11c2e8f6c74519d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black matte shirt at center is positioned above light skin tone flesh at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, black matte shirt at center is located above light skin tone flesh at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ea5555659571648.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the matte black belly at center? (A) black matte shirt at upper center (B) pink matte shirt at center" }, { "from": "gpt", "value": "(A) black matte shirt at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a349044eb088d5b5.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) matte black minifigure at left (B) wooden table at center" }, { "from": "gpt", "value": "(B) wooden table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cdf9f9faadbb4183.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.566, 0.720) (B) (0.793, 0.978)" }, { "from": "gpt", "value": "(A) (0.566, 0.720)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/719d31fc27e62b87.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of white matte table at right in reference to wooden table at left? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ae7f8ca1489a9ae.jpg", "conversations": [ { "from": "human", "value": "\nIs white stone lion at lower left above dark gray stone door at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, white stone lion at lower left is positioned over dark gray stone door at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5f140e63a5c1e64c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.912, 0.159) (B) (0.514, 0.620) (C) (0.190, 0.391)" }, { "from": "gpt", "value": "(B) (0.514, 0.620)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd8c0d44f9704a82.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if light brown sandy beach at lower left is bigger than clear blue water at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, light brown sandy beach at lower left is not bigger than clear blue water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/908ae2e86209d999.jpg", "conversations": [ { "from": "human", "value": "\nWhere is matte white tank top at lower left located in relation to blue plastic chair at center in the image? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f1558922fe70219.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.374, 0.698) (B) (0.326, 0.106)" }, { "from": "gpt", "value": "(A) (0.374, 0.698)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b8ee4a85adb5cc4a.jpg", "conversations": [ { "from": "human", "value": "\nDoes smooth concrete pole at left appear over red stop sign at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, smooth concrete pole at left is below red stop sign at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/023ff4c44038cd00.jpg", "conversations": [ { "from": "human", "value": "\nIs matte white van at center further to camera compared to metallic blue car at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, matte white van at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/39cd1d15c226ecb1.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.265, 0.941) (B) (0.370, 0.492) (C) (0.469, 0.628)" }, { "from": "gpt", "value": "(B) (0.370, 0.492)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/008d662cd9d85caf.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.332, 0.447) (B) (0.530, 0.420) (C) (0.467, 0.414) (D) (0.757, 0.703)" }, { "from": "gpt", "value": "(C) (0.467, 0.414)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ea27cae29329ed8.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the blue fleece jacket at lower center? (A) red plastic ski pole at center (B) green matte jacket at center" }, { "from": "gpt", "value": "(A) red plastic ski pole at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cbaf3d393713577b.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.810, 0.848) (B) (0.376, 0.133) (C) (0.370, 0.806) (D) (0.738, 0.750)" }, { "from": "gpt", "value": "(B) (0.376, 0.133)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff2e24ed1ea8a494.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.480, 0.616) (B) (0.689, 0.636)" }, { "from": "gpt", "value": "(A) (0.480, 0.616)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/959410b0d10223cc.jpg", "conversations": [ { "from": "human", "value": "\nIs white stone church at center bigger than metallic spire at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9e3a5a4666f888cc.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black car at left to the right of white matte car at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, matte black car at left is not on the right side of white matte car at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1dbc568e62f11645.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black laptop at center have a smaller size compared to silver metallic laptop at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6dce0f11822569da.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the blue camouflage uniform at lower left? Choose from: (A) denim jeans at left (B) blue denim jeans at center" }, { "from": "gpt", "value": "(A) denim jeans at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9171b93213978e54.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of camouflage pants at center in relation to green fabric harness at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c61991df6eeb41f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.057, 0.822) (B) (0.992, 0.164)" }, { "from": "gpt", "value": "(A) (0.057, 0.822)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e3106c05a67f5003.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) matte cardboard box at center (B) white fabric at upper right" }, { "from": "gpt", "value": "(B) white fabric at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4e5cff82a868ebf1.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) blue printed shorts at center (B) blue textured shorts at upper right (C) pink fabric swimsuit at center" }, { "from": "gpt", "value": "(C) pink fabric swimsuit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e7d1e353264c3569.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white smooth podium at center is bigger than black matte microphone at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, white smooth podium at center is bigger than black matte microphone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e523d0d32147ff22.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) blue jersey at center (B) yellow matte jersey at center (C) green grass at center" }, { "from": "gpt", "value": "(C) green grass at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37eeadccfcbb5839.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the white matte shirt at center among (A) wooden at center (B) whiteboard at upper center (C) black plastic fan at left?" }, { "from": "gpt", "value": "(A) wooden at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08e685dc250f2530.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green grassy wheat field at center is thinner than green leafy palm tree at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green grassy wheat field at center has a lesser width compared to green leafy palm tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ba1fe2e210a3277.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the leopard print hat at center? (A) brown leather hat at lower left (B) black speckled pavement at center" }, { "from": "gpt", "value": "(A) brown leather hat at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b194384e8e8e72a2.jpg", "conversations": [ { "from": "human", "value": "\nIs gray stone church at center below striped fabric dress at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1569eb110152bccf.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.722, 0.920) (B) (0.095, 0.637) (C) (0.464, 0.523)" }, { "from": "gpt", "value": "(C) (0.464, 0.523)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a3fbd03daac1271.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the black matte whale at center from the following options: (A) blue paper seal at center (B) pink matte heart at center?" }, { "from": "gpt", "value": "(A) blue paper seal at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf9d8b4668a0740e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.851, 0.597) (B) (0.496, 0.472) (C) (0.492, 0.648) (D) (0.179, 0.198)" }, { "from": "gpt", "value": "(C) (0.492, 0.648)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/72b1692d7e6a916e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.848, 0.416) (B) (0.020, 0.544) (C) (0.686, 0.419) (D) (0.203, 0.298)" }, { "from": "gpt", "value": "(A) (0.848, 0.416)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c408e64eef764da2.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at center bigger than wooden cabin at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, green leafy tree at center is larger in size than wooden cabin at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe612d9b137ff448.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.821, 0.403) (B) (0.701, 0.386)" }, { "from": "gpt", "value": "(A) (0.821, 0.403)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8096dc67d4c71ce7.jpg", "conversations": [ { "from": "human", "value": "\nIs matte white shirt at center positioned before matte brown hat at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, matte white shirt at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c6c79512cd9748a7.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) white glossy shirt at center (B) black matte jacket at left" }, { "from": "gpt", "value": "(B) black matte jacket at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06cad3e63fe2b073.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black swimsuit at center have a greater width compared to white feathered bird at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, matte black swimsuit at center has a greater width compared to white feathered bird at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0dd491984913823e.jpg", "conversations": [ { "from": "human", "value": "\nDoes shiny metallic bicycle at center have a greater width compared to matte black helmet at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of shiny metallic bicycle at center exceeds that of matte black helmet at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d04a3cecf55fc0b.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black monitor at center have a smaller size compared to matte black monitor at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, matte black monitor at center has a smaller size compared to matte black monitor at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8fe2386a8ab5bb03.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the matte black sedan at center? (A) shiny chrome motorbike at center (B) silver metallic hatchback at center" }, { "from": "gpt", "value": "(A) shiny chrome motorbike at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/622a436e3dc4a417.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is white matte van at center located relative to blonde hair at upper center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06d6c0e7caa54b65.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.466, 0.659) (B) (0.579, 0.625)" }, { "from": "gpt", "value": "(B) (0.579, 0.625)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b2d12a207295a46.jpg", "conversations": [ { "from": "human", "value": "\nDoes sandy beige dunes at lower left have a lesser width compared to matte black jacket at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, sandy beige dunes at lower left is not thinner than matte black jacket at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d70a6bed9149d938.jpg", "conversations": [ { "from": "human", "value": "\nIs matte red book at center positioned in front of matte red book at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, matte red book at center is behind matte red book at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29f998bf10797ef1.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the shiny brown nori at center among (A) nail polish at center (B) smooth skin hand at center?" }, { "from": "gpt", "value": "(B) smooth skin hand at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60418d278f8fbf98.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.324, 0.597) (B) (0.941, 0.944)" }, { "from": "gpt", "value": "(B) (0.941, 0.944)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8a293b5365ad58f.jpg", "conversations": [ { "from": "human", "value": "\nIs metallic gray clock at center positioned behind metallic cross at top? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03846191f051b3cc.jpg", "conversations": [ { "from": "human", "value": "\nIs blue cotton shirt at center above blue smooth shirt at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef64ce1671d69985.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is dark gray shirt at left located relative to dark gray backpack at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9b8f0425fb2c6b5.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.641, 0.384) (B) (0.417, 0.348) (C) (0.342, 0.239) (D) (0.314, 0.170)" }, { "from": "gpt", "value": "(C) (0.342, 0.239)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d38fa35e90ee761.jpg", "conversations": [ { "from": "human", "value": "\nDoes orange satin dress at center appear on the right side of white tulle dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, orange satin dress at center is to the right of white tulle dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04e96a242fd3ee7a.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte smartphone at center thinner than black matte video player at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, black matte smartphone at center might be wider than black matte video player at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5db6aadd0385a8a0.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black car at lower left have a greater width compared to metallic red truck at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, matte black car at lower left is not wider than metallic red truck at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6eb5815a1c4c105c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown sandy dirt at center is positioned below metal mesh fence at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, brown sandy dirt at center is located below metal mesh fence at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ae3fa438af71a77b.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) white cotton tank top at center (B) brown sandy beach at lower center (C) blue water at lower center" }, { "from": "gpt", "value": "(C) blue water at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/19ab4f2a512dc2f9.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.848, 0.495) (B) (0.593, 0.500)" }, { "from": "gpt", "value": "(A) (0.848, 0.495)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b96b44734131946.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of striped cotton shirt at center and white wood bar stool at left in the image provided, where is striped cotton shirt at center located with respect to white wood bar stool at left? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c5d0e097c8eaab8.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if denim jacket at center is positioned above transparent purple umbrella at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, denim jacket at center is positioned over transparent purple umbrella at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1083af9ec367fc73.jpg", "conversations": [ { "from": "human", "value": "\nDoes black velvet cape at lower right have a larger size compared to brown leather vest at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, black velvet cape at lower right is not bigger than brown leather vest at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6528b75805e59057.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green grass at center is positioned above gray concrete ledge at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b2953272f649c477.jpg", "conversations": [ { "from": "human", "value": "\nIs brown woven fabric at left closer to the viewer compared to brown woven mat at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, brown woven fabric at left is behind brown woven mat at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fec7cc30aee14cc0.jpg", "conversations": [ { "from": "human", "value": "\nIs blue liquid water at upper left thinner than green leafy hillside at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16f4386e4b1317a5.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of matte ceramic mug at center less distant than that of white glossy shelf at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f58e54c7a0dda11.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) clear glass window at upper center (B) transparent glass window at center, is positioned closest to the wooden chair at center?" }, { "from": "gpt", "value": "(B) transparent glass window at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/25d738bd7d948662.jpg", "conversations": [ { "from": "human", "value": "\nDoes earthenware bowl at center lie behind silver metallic spoon at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, earthenware bowl at center is in front of silver metallic spoon at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/907ccf3208987304.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is wooden table at center located relative to white paper sign at center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c9482203bcdc28f7.jpg", "conversations": [ { "from": "human", "value": "\nIs white canvas shoe at lower center to the right of white canvas shoe at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white canvas shoe at lower center is not on the right side of white canvas shoe at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85f49ed8d1826f52.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black backpack at center below plaid shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/da1f8c252cc1da5d.jpg", "conversations": [ { "from": "human", "value": "\nDoes camouflage fabric sleeping bag at center come in front of camouflage fabric person at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, camouflage fabric sleeping bag at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0adc230a34fa60f1.jpg", "conversations": [ { "from": "human", "value": "\nDoes bright white teeth at center appear on the left side of matte black mouth at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, bright white teeth at center is not to the left of matte black mouth at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6647a49e91adb817.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the camouflage pants at center? Choose among these: (A) orange fabric shirt at upper right (B) pink matte bow at center" }, { "from": "gpt", "value": "(A) orange fabric shirt at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23eb657cfe219af5.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.030, 0.669) (B) (0.420, 0.486)" }, { "from": "gpt", "value": "(B) (0.420, 0.486)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/013108b1615a66a8.jpg", "conversations": [ { "from": "human", "value": "\nIs green mossy branch at upper center wider than green leafy palm at center-right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/408d732067d6529d.jpg", "conversations": [ { "from": "human", "value": "\nIs matte brown shirt at center closer to camera compared to speckled fur dog at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is behind speckled fur dog at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/044218756e6fdccd.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.617, 0.573) (B) (0.681, 0.584)" }, { "from": "gpt", "value": "(B) (0.681, 0.584)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce2a229e21895da1.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is brown smooth dog at center located relative to brown furry dog at lower right? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f3dc66cfbe1e2b66.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the green leafy tree at center? Choose from: (A) green leafy tree at upper right (B) brown brick building at center (C) metallic pole at center (D) satin silver pole at center" }, { "from": "gpt", "value": "(C) metallic pole at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/221a72a38a3082df.jpg", "conversations": [ { "from": "human", "value": "\nIs white paper at center to the right of pink fabric purse at left from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, white paper at center is to the right of pink fabric purse at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c65bb8bf69c15992.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the green fabric flag at upper center? Select from: (A) green velvet robe at center (B) green fabric horse at center" }, { "from": "gpt", "value": "(B) green fabric horse at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92e3ebaaf6c181c5.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the matte black jacket at lower right among (A) matte black jacket at center (B) smooth leather jacket at upper left?" }, { "from": "gpt", "value": "(A) matte black jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c019ac5d2646b2eb.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if wooden door at center is positioned to the left of stone plaque at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, wooden door at center is not to the left of stone plaque at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04f1f5e47ed1f7ff.jpg", "conversations": [ { "from": "human", "value": "\nIs dark purple dress at center to the right of matte black jacket at upper left from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, dark purple dress at center is positioned on the right side of matte black jacket at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/869803fc6c329486.jpg", "conversations": [ { "from": "human", "value": "\nDoes pink satin hijab at center appear on the left side of blue fabric shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, pink satin hijab at center is to the right of blue fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00a0fd8177a1db74.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) green leafy tree at upper right (B) green leafy tree at right" }, { "from": "gpt", "value": "(A) green leafy tree at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6a8d9f196ecfe043.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the snowy mountain at center? (A) matte black goggles at center (B) light gray waterproof jacket at center" }, { "from": "gpt", "value": "(B) light gray waterproof jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/76ca747f7852e369.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of multicolored fabric bikini top at center in relation to multicolored plastic goggles at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e72c6a89e554a216.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the camouflage fabric uniform at right? Choose among these: (A) camouflage fabric uniform at center (B) camouflage fabric uniform at left (C) camouflage fabric at center" }, { "from": "gpt", "value": "(C) camouflage fabric at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b61f95a25185ed5c.jpg", "conversations": [ { "from": "human", "value": "\nDoes rusty rock pile at center appear on the right side of brown cotton t-shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, rusty rock pile at center is not to the right of brown cotton t-shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a81c2e393d1d38a4.jpg", "conversations": [ { "from": "human", "value": "\nDoes white concrete building at upper right appear over white glass building at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/da32dc7efbe1f842.jpg", "conversations": [ { "from": "human", "value": "\nDoes light blue cotton shirt at center have a greater width compared to gold metallic ring at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f4e45ae627ee8970.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte jeans at center thinner than denim jeans at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white matte jeans at center's width is not less than denim jeans at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7fe1c7659224c5ab.jpg", "conversations": [ { "from": "human", "value": "\nDoes silver metallic stereo at center appear over black plastic stereo at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, silver metallic stereo at center is not positioned above black plastic stereo at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/162671e8d1e6ff2a.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy plant at left further to the viewer compared to clear glass window at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/718d10d43f747ea1.jpg", "conversations": [ { "from": "human", "value": "\nIs stone textured stairs at center behind matte glass streetlamp at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eafbba8a4e79e16c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.353, 0.175) (B) (0.004, 0.866)" }, { "from": "gpt", "value": "(B) (0.004, 0.866)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/392076b6ae1a9833.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.590, 0.448) (B) (0.529, 0.836)" }, { "from": "gpt", "value": "(B) (0.529, 0.836)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4df4023f904f0684.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) green matte parrot at center (B) white matte pole at left" }, { "from": "gpt", "value": "(A) green matte parrot at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/052b85d13b4e38bc.jpg", "conversations": [ { "from": "human", "value": "\nIs black mesh/synthetic salomon shoe at center to the right of black fabric hand at lower left from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, black mesh/synthetic salomon shoe at center is positioned on the right side of black fabric hand at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/060d35ad923ab430.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is brown fuzzy squirrel at lower left located relative to brown fuzzy squirrel at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08fad3be6930d46c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.547, 0.478) (B) (0.791, 0.953) (C) (0.049, 0.281)" }, { "from": "gpt", "value": "(B) (0.791, 0.953)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ee8dd1257bf38f5.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) striped cotton shirt at center (B) smooth skin handshake at center" }, { "from": "gpt", "value": "(A) striped cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/127b880d1e647bc9.jpg", "conversations": [ { "from": "human", "value": "\nWhere is dark gray stone church at center located in relation to dark gray stone tower at center in the image? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4906d84ac3cb492b.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) clear glass wine glass at left (B) clear glass wine glass at upper left (C) clear glass wine glass at center (D) white cloth-covered table at center" }, { "from": "gpt", "value": "(C) clear glass wine glass at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/97bfd32731bb1a54.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the sepia textured mountain at center from the following options: (A) green matte trees at lower left (B) golden textured sky at upper center?" }, { "from": "gpt", "value": "(B) golden textured sky at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b8fe1e1a9d47c293.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) green textured cypress tree at upper center (B) green leafy cypress at upper center" }, { "from": "gpt", "value": "(A) green textured cypress tree at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e09efe8a11253ef1.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.728, 0.581) (B) (0.205, 0.675)" }, { "from": "gpt", "value": "(A) (0.728, 0.581)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c0d1ab45f76cf9e8.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown hair at lower center appear on the right side of smooth black shirt at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, brown hair at lower center is to the right of smooth black shirt at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29d060a4677a9cb7.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) shiny blue fabric dress at center (B) shiny multicolored skirt at center" }, { "from": "gpt", "value": "(B) shiny multicolored skirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ae0be11757643b1b.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) metallic silver guitar at center (B) natural wood acoustic guitar at center (C) red matte shirt at right" }, { "from": "gpt", "value": "(A) metallic silver guitar at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d38b6aa146973b3.jpg", "conversations": [ { "from": "human", "value": "\nDoes shiny silver necklace at upper right appear over white plastic hoop at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, shiny silver necklace at upper right is not above white plastic hoop at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b45f652277464e2e.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) velvet/cloth mannequin at upper left (B) sparkly purple fabric at center" }, { "from": "gpt", "value": "(B) sparkly purple fabric at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49202c46f30aba05.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the glossy blue balloon at center? Choose among these: (A) light gray fleece jacket at center (B) striped shirt at center (C) fluffy brown teddy bear at center (D) white fuzzy coat at lower center" }, { "from": "gpt", "value": "(C) fluffy brown teddy bear at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b60c23b449ad9c3.jpg", "conversations": [ { "from": "human", "value": "\nDoes rusty metal bridge at center have a smaller size compared to metallic gray boat at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be0eba0478d42543.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.078, 0.828) (B) (0.883, 0.988) (C) (0.358, 0.173)" }, { "from": "gpt", "value": "(B) (0.883, 0.988)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/75b53f0656617504.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.517, 0.397) (B) (0.431, 0.362) (C) (0.995, 0.650)" }, { "from": "gpt", "value": "(A) (0.517, 0.397)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f30f206eb4287d0d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) woven multicolored basket at center (B) woven wood basket at lower left" }, { "from": "gpt", "value": "(A) woven multicolored basket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b63f5e83e02f9d0.jpg", "conversations": [ { "from": "human", "value": "\nDoes gravel at center come behind stone church at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, gravel at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be448aad07fbbf91.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.125, 0.839) (B) (0.852, 0.734)" }, { "from": "gpt", "value": "(A) (0.125, 0.839)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7dea4b065e7631c.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte stormtrooper helmet at center bigger than white matte stormtrooper at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white matte stormtrooper helmet at center is not larger than white matte stormtrooper at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b9ad12be444dbe0.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.970, 0.134) (B) (0.200, 0.822) (C) (0.957, 0.702)" }, { "from": "gpt", "value": "(B) (0.200, 0.822)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb77edf0b1b6aa04.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.145, 0.805) (B) (0.253, 0.741)" }, { "from": "gpt", "value": "(A) (0.145, 0.805)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ffb9a5dc02e75444.jpg", "conversations": [ { "from": "human", "value": "\nIs light brown fabric guitar at center closer to the viewer compared to matte black guitar at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e1b7e303700bc8ec.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the green leafy tree at right? Choose from: (A) green leafy tree at center (B) green reflective water at center" }, { "from": "gpt", "value": "(A) green leafy tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/15953cf5858b2755.jpg", "conversations": [ { "from": "human", "value": "\nIs dark gray textured stingray at center positioned before shiny yellow fish at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, dark gray textured stingray at center is in front of shiny yellow fish at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5be5533c3c4aae54.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.475, 0.163) (B) (0.958, 0.295) (C) (0.903, 0.075)" }, { "from": "gpt", "value": "(B) (0.958, 0.295)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6a2f4e9411b8aebf.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the matte black camera at center? (A) black wool coat at center (B) dark gray leather jacket at center (C) knitted wool scarf at center (D) polka dot scarf at center" }, { "from": "gpt", "value": "(B) dark gray leather jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8dcc6fbd81fc52d3.jpg", "conversations": [ { "from": "human", "value": "\nIs light gray fabric shirt at lower left further to camera compared to shiny brown wood at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is in front of shiny brown wood at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed4e1a1e50fa6493.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) white dotted apron at center (B) floral fabric apron at left (C) floral fabric apron at center (D) white glossy exhaust hood at upper center, is positioned farthest from the white dotted apron at lower center?" }, { "from": "gpt", "value": "(D) white glossy exhaust hood at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3fb8135dfd68f5b7.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the matte black face at center? (A) pink glossy lipstick at center (B) matte pink lips at center (C) matte yellow tank top at center" }, { "from": "gpt", "value": "(B) matte pink lips at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/72290079eef9cee1.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the blue fabric chair at lower center? Select from: (A) green glass bottle at left (B) hardcover book at center (C) white paper book at lower left (D) matte brown shirt at center" }, { "from": "gpt", "value": "(A) green glass bottle at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16d92ea461f80f8e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dirt at center is positioned below gray rocky mountain at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, dirt at center is located below gray rocky mountain at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b12f9ece86babb23.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black and white printed dress at center is thinner than pearl necklace at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, black and white printed dress at center might be wider than pearl necklace at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d5003465755cf64.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.701, 0.577) (B) (0.562, 0.606) (C) (0.083, 0.787)" }, { "from": "gpt", "value": "(C) (0.083, 0.787)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e60918247eeb6c1.jpg", "conversations": [ { "from": "human", "value": "\nIs black fleece hoodie at center bigger than smooth brown bark at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c4fe6d90f044914.jpg", "conversations": [ { "from": "human", "value": "\nIs white snow-covered tree at center positioned at the back of white snow-covered tree at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, white snow-covered tree at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/93a07fb5b01395c9.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) snowy white hillside at lower left (B) snow-covered branches at upper center" }, { "from": "gpt", "value": "(A) snowy white hillside at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/63c463f64923f942.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.194, 0.119) (B) (0.530, 0.778)" }, { "from": "gpt", "value": "(A) (0.194, 0.119)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01da8018c4ee07bf.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.271, 0.747) (B) (0.894, 0.930) (C) (0.559, 0.411)" }, { "from": "gpt", "value": "(B) (0.894, 0.930)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8672ac8d8c12f46c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.399, 0.614) (B) (0.095, 0.211)" }, { "from": "gpt", "value": "(B) (0.095, 0.211)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9e430be0afb590e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green grassy field at lower center is bigger than stone church at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8efe49cca8796898.jpg", "conversations": [ { "from": "human", "value": "\nDoes green matte tree at left appear on the right side of yellow-green leaves at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, green matte tree at left is to the left of yellow-green leaves at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fbbf2d433b96d43d.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) white matte sweatshirt at lower left (B) gray cobblestone pavement at lower right" }, { "from": "gpt", "value": "(B) gray cobblestone pavement at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/045b5f7f4138d671.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) silver metallic monitor at center (B) matte silver laptop at right (C) matte black monitor at left" }, { "from": "gpt", "value": "(B) matte silver laptop at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f13e6c90048b0de4.jpg", "conversations": [ { "from": "human", "value": "\nDoes white lace dress at center appear on the right side of light gray pinstripe suit at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, white lace dress at center is to the left of light gray pinstripe suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/54aedb2d789175c5.jpg", "conversations": [ { "from": "human", "value": "\nIs maroon leather book at center positioned before matte black glasses at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/706a23d2e0d9c718.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at upper left have a larger size compared to green leafy tree at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/abfc327d6af85d66.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) black zip-up hoodie at center (B) dark blue hoodie at center" }, { "from": "gpt", "value": "(B) dark blue hoodie at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/17047e1e650b6c2b.jpg", "conversations": [ { "from": "human", "value": "\nIs brown dry grass at center thinner than green grassy hill at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, brown dry grass at center has a lesser width compared to green grassy hill at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c71691d304f637da.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray matte steering wheel at upper left is wider than black plastic speaker at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, gray matte steering wheel at upper left might be narrower than black plastic speaker at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1bc01ddec1d1bbd5.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.589, 0.402) (B) (0.624, 0.530) (C) (0.657, 0.459) (D) (0.608, 0.373)" }, { "from": "gpt", "value": "(A) (0.589, 0.402)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e45837c2f7f17cd.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) greenish water at lower center (B) light brown wooden boat at lower center" }, { "from": "gpt", "value": "(A) greenish water at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/41c843a337007918.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) gold metallic earrings at right (B) gold/textured metal teardrop-shaped earring at ear" }, { "from": "gpt", "value": "(B) gold/textured metal teardrop-shaped earring at ear" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/94d8c71efc997899.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte camera at upper center below blue fabric shorts at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, white matte camera at upper center is below blue fabric shorts at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/18a78ffc0aef56da.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of white lace headscarf at upper right in relation to dark brown matte hair at center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c5cd8d76f8287950.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if shiny black crocodile at center is positioned to the left of shiny dark green crocodile at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, shiny black crocodile at center is positioned on the left side of shiny dark green crocodile at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cfae50e69fc8aa65.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.682, 0.784) (B) (0.237, 0.325)" }, { "from": "gpt", "value": "(B) (0.237, 0.325)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9baaf7d85e6888ac.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the shiny black dog at upper left? Choose among these: (A) velvety red blanket at upper center (B) black fur dog at center" }, { "from": "gpt", "value": "(A) velvety red blanket at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cb9a7a6d72c3ea34.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the pink cotton shirt at center? (A) blue matte hijab at center (B) white cotton robe at center (C) beige fabric chair at center" }, { "from": "gpt", "value": "(C) beige fabric chair at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c1edea91ca40028c.jpg", "conversations": [ { "from": "human", "value": "\nIs autumn leaves at upper right to the left of reddish-brown textured tree at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, autumn leaves at upper right is not on the left side of reddish-brown textured tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/30198e99fc7145d5.jpg", "conversations": [ { "from": "human", "value": "\nIs asphalt road at center further to the viewer compared to black canvas shoes at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is in front of black canvas shoes at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6cfd428e77c460b2.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black bobblehead at center further to camera compared to white plastic crown at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is in front of white plastic crown at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f2986cb1dc993a29.jpg", "conversations": [ { "from": "human", "value": "\nIs transparent glass at upper right below matte brown sandwich at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cefa5066957e699a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) green leafy tree at right (B) white fluffy cloud at upper center (C) bare wood tree at center" }, { "from": "gpt", "value": "(B) white fluffy cloud at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb7bb16e74e22218.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.524, 0.894) (B) (0.586, 0.856)" }, { "from": "gpt", "value": "(A) (0.524, 0.894)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/143eae7dd1801613.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.081, 0.502) (B) (0.784, 0.850)" }, { "from": "gpt", "value": "(B) (0.784, 0.850)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e97f886bfd20fdf8.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is green leafy hedge at center located relative to green hedge at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7ab29b7a7fd7e3b.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) blue uniformed man at center (B) light brown fabric bag at lower left" }, { "from": "gpt", "value": "(B) light brown fabric bag at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e3667af395cb8af.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.542, 0.391) (B) (0.855, 0.111) (C) (0.285, 0.891)" }, { "from": "gpt", "value": "(C) (0.285, 0.891)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7d5d4c25014db494.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) matte black glasses at left (B) matte black dress at center (C) pearl and beaded necklace at center (D) pink beaded necklace at center" }, { "from": "gpt", "value": "(A) matte black glasses at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2507cf12012d69ca.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the white matte uniform at center? Choose from: (A) blue fabric astronaut at left (B) blue fabric jacket at center" }, { "from": "gpt", "value": "(B) blue fabric jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e33015025df826f1.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray rocky mountain at upper center have a larger size compared to green leafy palm at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, gray rocky mountain at upper center has a larger size compared to green leafy palm at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7742ab82255d5291.jpg", "conversations": [ { "from": "human", "value": "\nIs brown rough rock at center below clear blue water at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, brown rough rock at center is below clear blue water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4ac184004cc019dc.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is matte skin at left located relative to embroidered denim baseball cap at upper right? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a77401b7502670a3.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the high-visibility yellow reflective jacket at center? Choose among these: (A) neon yellow reflective vest at center (B) white matte suv at center (C) neon yellow reflective safety vest at center" }, { "from": "gpt", "value": "(A) neon yellow reflective vest at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d595263b8029134d.jpg", "conversations": [ { "from": "human", "value": "\nDoes clear water at center appear over white matte ferry at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2cb85aab4f889b15.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.525, 0.473) (B) (0.050, 0.423)" }, { "from": "gpt", "value": "(A) (0.525, 0.473)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d35d7f3efaa5f08.jpg", "conversations": [ { "from": "human", "value": "\nDoes white wooden bookshelf at center have a greater width compared to black fabric backpack at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, white wooden bookshelf at center has a greater width compared to black fabric backpack at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c44a1dd07d269861.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.635, 0.373) (B) (0.054, 0.928)" }, { "from": "gpt", "value": "(B) (0.054, 0.928)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bfc4ece458d42bfd.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) white matte pants at lower left (B) metallic gray bridge at upper center" }, { "from": "gpt", "value": "(A) white matte pants at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/83832824a174405a.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the white marble statue at center from the following options: (A) white fabric bag at center (B) white marble reclining figure at left?" }, { "from": "gpt", "value": "(B) white marble reclining figure at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf1b882d3bc605ab.jpg", "conversations": [ { "from": "human", "value": "\nIs green grassy bank at lower left wider than green grassy hillside at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green grassy bank at lower left has a greater width compared to green grassy hillside at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ac038ad662649baf.jpg", "conversations": [ { "from": "human", "value": "\nDoes green reflective water at center lie in front of green leafy tree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is behind green leafy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/24ac7cdbaeb4dd88.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.555, 0.439) (B) (0.446, 0.703)" }, { "from": "gpt", "value": "(A) (0.555, 0.439)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ceda00db108153ce.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) gray cotton t-shirt at left (B) white plaid shirt at center (C) floral fabric dress at center" }, { "from": "gpt", "value": "(A) gray cotton t-shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4bed094067ef3416.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue woolen coat at center appear under white fabric mask at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, blue woolen coat at center is located below white fabric mask at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d36e9a57efba661.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if camouflage uniform at center is positioned to the right of blue cotton shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, camouflage uniform at center is not to the right of blue cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9b5b902a0cc9fa4.jpg", "conversations": [ { "from": "human", "value": "\nIs dark gray textured crocodile at upper left to the right of dark gray scaly crocodile at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, dark gray textured crocodile at upper left is positioned on the right side of dark gray scaly crocodile at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d2e2db8b022bce87.jpg", "conversations": [ { "from": "human", "value": "\nIs dark blue sweater at center above blue denim shirt at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, dark blue sweater at center is not positioned above blue denim shirt at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a5c8d7015dbb5ef.jpg", "conversations": [ { "from": "human", "value": "\nIs blue water at lower center behind white glossy boat at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ecefb4dedf8a5ba3.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the blue matte plastic horse at center? (A) white cotton shirt at upper right (B) yellow plastic swing at upper left" }, { "from": "gpt", "value": "(A) white cotton shirt at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5051f990b738acf1.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black tank top at center closer to the viewer compared to light pink skin at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte black tank top at center is in front of light pink skin at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b499adc8d13bf24.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) white plastic cutting board at lower left (B) white translucent bowl at center" }, { "from": "gpt", "value": "(B) white translucent bowl at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eff12fff67d8dd46.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.372, 0.659) (B) (0.148, 0.708) (C) (0.345, 0.631)" }, { "from": "gpt", "value": "(C) (0.345, 0.631)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4d89422379060d15.jpg", "conversations": [ { "from": "human", "value": "\nIs bare branches at left above clear water at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f369d30ba27bc729.jpg", "conversations": [ { "from": "human", "value": "\nIs white cotton scarf at center bigger than smooth stone statue at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, white cotton scarf at center might be smaller than smooth stone statue at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/adba68d5221eceac.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.959, 0.895) (B) (0.545, 0.716)" }, { "from": "gpt", "value": "(B) (0.545, 0.716)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d798bfc03a5e967.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if printed fabric umbrella at center is smaller than metallic white chair at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f26efb26ce63c99.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.207, 0.111) (B) (0.420, 0.369)" }, { "from": "gpt", "value": "(A) (0.207, 0.111)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bb8ed20ce8d419f4.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) decorative paper umbrella at center (B) blue denim skirt at left (C) matte red cap at center (D) blue striped shirt at lower right" }, { "from": "gpt", "value": "(C) matte red cap at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/647719dd0eadf541.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is white matte van at lower right located relative to white matte sedan at right? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0ff1026657d5601.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte shirt at center behind white shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is in front of white shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d16666369a5d14a6.jpg", "conversations": [ { "from": "human", "value": "\nIs glossy black water at center bigger than matte black canal boat at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, glossy black water at center is larger in size than matte black canal boat at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86047a65cbd81368.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the blue pinstripe suit at center? Choose from: (A) purple satin tie at left (B) black leather hand at center (C) black pinstripe suit at left (D) blue striped tie at right" }, { "from": "gpt", "value": "(D) blue striped tie at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d7dc024c301a4ab.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.525, 0.408) (B) (0.310, 0.567)" }, { "from": "gpt", "value": "(A) (0.525, 0.408)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e33b4a5da5a62b4c.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.404, 0.880) (B) (0.447, 0.584) (C) (0.297, 0.552) (D) (0.059, 0.502)" }, { "from": "gpt", "value": "(A) (0.404, 0.880)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ab468afbe32f273.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.493, 0.664) (B) (0.344, 0.119) (C) (0.289, 0.797)" }, { "from": "gpt", "value": "(A) (0.493, 0.664)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/38f3ca08f84f56bf.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of teal fabric shirt at left in relation to yellow fabric hospital bed at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9ebcfac2f1bbe4a.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) purple cotton shirt at center (B) matte black suit at center (C) teal scarf at center" }, { "from": "gpt", "value": "(C) teal scarf at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4761a3e7555750c7.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.233, 0.688) (B) (0.440, 0.178)" }, { "from": "gpt", "value": "(A) (0.233, 0.688)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a552e572ea5efe08.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the dark gray fabric jacket at center? (A) white stone temple at left (B) gray stone man at lower center (C) gray stone steps at center" }, { "from": "gpt", "value": "(A) white stone temple at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86a9e48c7130acfd.jpg", "conversations": [ { "from": "human", "value": "\nIs blue striped shirt at left thinner than matte black sunglasses at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, blue striped shirt at left might be wider than matte black sunglasses at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4d91e39ba97422d2.jpg", "conversations": [ { "from": "human", "value": "\nIs red matte jacket at right to the left of red matte life jacket at upper right from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, red matte jacket at right is to the right of red matte life jacket at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/15c980c91a96c872.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) wooden table at lower right (B) green striped swimsuit at center" }, { "from": "gpt", "value": "(B) green striped swimsuit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8657aeea5eae3a3e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) matte black jacket at center (B) gray cotton t-shirt at left" }, { "from": "gpt", "value": "(B) gray cotton t-shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/490430d300bf2567.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark gray sweater at center appear on the left side of smooth red flower at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, dark gray sweater at center is not to the left of smooth red flower at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a26dddf9d412e82c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.851, 0.195) (B) (0.397, 0.769)" }, { "from": "gpt", "value": "(B) (0.397, 0.769)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e63fcf9cd597590.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) brown matte leaf at lower left (B) green matte leaf at lower center" }, { "from": "gpt", "value": "(A) brown matte leaf at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ccc1a1ca697823b.jpg", "conversations": [ { "from": "human", "value": "\nIs white snow-covered mountain at center smaller than orange softshell jacket at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, white snow-covered mountain at center is not smaller than orange softshell jacket at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a2ea8f93b4cb30a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.802, 0.925) (B) (0.033, 0.781) (C) (0.102, 0.614) (D) (0.819, 0.916)" }, { "from": "gpt", "value": "(C) (0.102, 0.614)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc3ad71686aab0a4.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.966, 0.797) (B) (0.239, 0.553) (C) (0.569, 0.570)" }, { "from": "gpt", "value": "(A) (0.966, 0.797)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9a827d8863b64b33.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is red dotted dress at center located relative to black suit at left? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/538ab6b77d562d03.jpg", "conversations": [ { "from": "human", "value": "\nIs beige brick building at center further to the viewer compared to matte beige building at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d3d5cc2505ee3ae5.jpg", "conversations": [ { "from": "human", "value": "\nIs black cotton shirt at center further to the viewer compared to blue cotton t-shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/876ef6bf41fad55b.jpg", "conversations": [ { "from": "human", "value": "\nIs matte brown hair at left to the left of matte gray jacket at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find matte brown hair at left to the left of matte gray jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ac1ffd7757c563e0.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte white pillar at upper center is positioned to the left of clear glass window at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, matte white pillar at upper center is not on the left side of clear glass window at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b6da13305f66b08.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark blue pinstripe suit at left appear under light gray blazer at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, dark blue pinstripe suit at left is not positioned below light gray blazer at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6eac72446b8bea79.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the matte black suit at center? Choose among these: (A) white zigzag shirt at right (B) black suit at left (C) white cloth table at center" }, { "from": "gpt", "value": "(B) black suit at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00c810aba8aa249a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if floral-patterned leggings at center is smaller than floral denim leggings at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, floral-patterned leggings at center might be larger than floral denim leggings at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/27e2d9590390e6c3.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark hair at lower right have a smaller size compared to matte gray shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, dark hair at lower right is not smaller in size than matte gray shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eba01272413429e3.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) pink matte flower at upper left (B) pink matte pencil at upper right, is positioned farthest from the matte black marker at upper right?" }, { "from": "gpt", "value": "(A) pink matte flower at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16f0996e7dd02c8d.jpg", "conversations": [ { "from": "human", "value": "\nIs printed fabric shirt at center to the left of matte black sunglasses at left from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, printed fabric shirt at center is not on the left side of matte black sunglasses at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/caa5d216f40c021a.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the smooth gray suit at right? Choose from: (A) brown leather jacket at center (B) matte blue shirt at left (C) brown cotton shirt at center (D) black satin suit at right" }, { "from": "gpt", "value": "(A) brown leather jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab4745e2efec05b0.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark gray suit at center is positioned above dark gray wool suit at right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, dark gray suit at center is not positioned above dark gray wool suit at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/74289c9d7599a4fd.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) brown woven cowboy hat at lower left (B) green leafy palm tree at left" }, { "from": "gpt", "value": "(A) brown woven cowboy hat at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/28ac932c243e0772.jpg", "conversations": [ { "from": "human", "value": "\nDoes white corrugated metal hut at lower center have a larger size compared to metallic silver water tower at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, white corrugated metal hut at lower center is larger in size than metallic silver water tower at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/034bcffa3cd22707.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black sunglasses at upper left appear on the left side of purple fabric shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find matte black sunglasses at upper left to the left of purple fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e895773666e72e0e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) white matte water at center (B) white matte pipe at center" }, { "from": "gpt", "value": "(B) white matte pipe at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc8b15a28ddff15b.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow striped polo shirt at center thinner than yellow matte tank top at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, yellow striped polo shirt at center's width is not less than yellow matte tank top at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c07a67a9564f92c.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte shirt at center have a greater width compared to dark brown fabric coat at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, white matte shirt at center is wider than dark brown fabric coat at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/047aea5850a4a05e.jpg", "conversations": [ { "from": "human", "value": "\nDoes silver metallic fence at lower center come behind yellow jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d58472eee2e4ace.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) brown marble column at right (B) light gray fabric person at center" }, { "from": "gpt", "value": "(A) brown marble column at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c19be24566e3784.jpg", "conversations": [ { "from": "human", "value": "\nDoes velvet black tunic at right come in front of green sheer dress at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, velvet black tunic at right is behind green sheer dress at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a1d3bfe6ff7d4261.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black coat at left above plaid woolen jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte black coat at left is above plaid woolen jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/31406afd775465fb.jpg", "conversations": [ { "from": "human", "value": "\nDoes smooth black hair at upper center have a greater width compared to matte black tank top at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, smooth black hair at upper center is not wider than matte black tank top at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85a197f7796d162a.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) smooth yellow shirt at right (B) matte blue shirt at center" }, { "from": "gpt", "value": "(A) smooth yellow shirt at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f4c0305fc6dedfc.jpg", "conversations": [ { "from": "human", "value": "\nDoes gold damask blanket at center lie in front of velvet deep red curtain at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, gold damask blanket at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1789266f0e38917.jpg", "conversations": [ { "from": "human", "value": "\nIs matte red paper with white polka dots at center thinner than wooden tray at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, matte red paper with white polka dots at center's width is less than wooden tray at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23e7536437f72b3b.jpg", "conversations": [ { "from": "human", "value": "\nWhere is light blue shirt at left located in relation to pink matte shorts at center in the image? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a9c37051341316cc.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.842, 0.166) (B) (0.435, 0.444) (C) (0.532, 0.527)" }, { "from": "gpt", "value": "(B) (0.435, 0.444)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fbe410bf638f6473.jpg", "conversations": [ { "from": "human", "value": "\nIs matte gray shorts at center above orange matte golf cart at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, matte gray shorts at center is not positioned above orange matte golf cart at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1c0acee5d9fa968.jpg", "conversations": [ { "from": "human", "value": "\nDoes checkered fabric shirt at center appear over dark gray fabric shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, checkered fabric shirt at center is not above dark gray fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08d7695260e29dcd.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) matte black dress at center (B) matte gray jacket at center (C) gray wool coat at center (D) black cotton polo shirt at center" }, { "from": "gpt", "value": "(A) matte black dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/24e493e31ff1bd6a.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of white polished wood boat at center in relation to white wood paddle at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ee8c03a083a1845.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) dark blue jeans at center (B) flaming wood at center, is positioned closest to the white matte jacket at center?" }, { "from": "gpt", "value": "(B) flaming wood at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c120edbe2567a10.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of wooden cabin at center in relation to blue fabric at center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c0770bea7e1a397f.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of striped cotton shirt at center more distant than that of white matte jeep at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf0cf5d291e33703.jpg", "conversations": [ { "from": "human", "value": "\nIs gray wool suit at center positioned in front of pink fabric dress at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37197dc36647ced8.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the matte red dress at left? Select from: (A) red matte sweater at center (B) navy blue sweater at center (C) translucent plastic container at lower right" }, { "from": "gpt", "value": "(C) translucent plastic container at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/71ac2c50b05a1db2.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if porcelain mosaic table at center is wider than metallic wire at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, porcelain mosaic table at center is wider than metallic wire at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c37f4bee68c1683a.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) white wooden table at center (B) white matte shirt at center (C) white matte shirt at left" }, { "from": "gpt", "value": "(B) white matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0190441b2346fc3c.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the red matte jacket at left from the following options: (A) white fleece jacket at center (B) gray synthetic life jacket at center (C) red softshell jacket at left (D) red/black neoprene life jacket at right?" }, { "from": "gpt", "value": "(C) red softshell jacket at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16e8b09105f16608.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) blue backpack at center (B) matte blue shorts at center, is positioned farthest from the matte purple backpack at center?" }, { "from": "gpt", "value": "(B) matte blue shorts at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c3594ffc850a54d3.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue plaid shirt at center have a smaller size compared to matte black shirt at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c1ae557130cb938.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the satin silver car at lower center? (A) shiny black sedan at center (B) concrete bridge at center" }, { "from": "gpt", "value": "(B) concrete bridge at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cfabec7a18809ae4.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the maroon silk robe at center? Select from: (A) green leather backpack at center (B) gold textured vest at center" }, { "from": "gpt", "value": "(A) green leather backpack at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1841dcb9c721fd16.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the white plastic printer at center? Choose among these: (A) black plastic table at center (B) black glossy microphone at upper right (C) white plastic register at right" }, { "from": "gpt", "value": "(B) black glossy microphone at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/11c6efa1dd4e47b4.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if tan suede jacket at center is positioned above white paper at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, tan suede jacket at center is below white paper at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d7cce0b285dbab8.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the yellow fabric shirt at center from the following options: (A) blue denim shirt at center (B) brushed metal shovel at lower left (C) brown soil at center?" }, { "from": "gpt", "value": "(A) blue denim shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a57a283a13d59e34.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.701, 0.662) (B) (0.636, 0.761) (C) (0.424, 0.205)" }, { "from": "gpt", "value": "(A) (0.701, 0.662)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4a4c0330387c222.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) matte blue shirt at upper left (B) transparent plastic table at center" }, { "from": "gpt", "value": "(B) transparent plastic table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d59dd941f94c304f.jpg", "conversations": [ { "from": "human", "value": "\nIs white paper banner at center to the right of matte black camera at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, white paper banner at center is positioned on the right side of matte black camera at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a88c8a9045915e7e.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the plaid shirt at center? (A) beige cotton t-shirt at upper right (B) metallic gray folding chair at lower left (C) gray fleece jacket at lower right" }, { "from": "gpt", "value": "(A) beige cotton t-shirt at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7fd5eaf64c18b510.jpg", "conversations": [ { "from": "human", "value": "\nDoes white carved column at center appear on the right side of white marble column at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, white carved column at center is to the left of white marble column at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1fb257baeba7282a.jpg", "conversations": [ { "from": "human", "value": "\nIs white textured bath at center in front of wooden frame at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is in front of wooden frame at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b8e0e7fe6a985b2.jpg", "conversations": [ { "from": "human", "value": "\nIs white fluffy snow at lower center above brown grass at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white fluffy snow at lower center is not positioned above brown grass at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5be54b9e0a2058fa.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the matte red shirt at center among (A) velvet santa claus at center (B) white fleece jacket at right?" }, { "from": "gpt", "value": "(A) velvet santa claus at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b3632bba55cbaa55.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte blue helmet at center have a greater width compared to sunglasses at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, matte blue helmet at center has a greater width compared to sunglasses at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c8f29ebc781ab13.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) dark blue hoodie at center (B) white fabric pants at center" }, { "from": "gpt", "value": "(A) dark blue hoodie at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb17719892dfb63d.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at left positioned behind white fabric at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/135e49ac535d0360.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white matte tank top at center is bigger than brown matte shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, white matte tank top at center is bigger than brown matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eade86d118a09608.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.455, 0.922) (B) (0.610, 0.842)" }, { "from": "gpt", "value": "(A) (0.455, 0.922)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3597c55fdc3feaaf.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white glass window at upper center is smaller than white glossy electric stove at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, white glass window at upper center is not smaller than white glossy electric stove at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c3dd38eee82e25ba.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at left wider than white glossy boat at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, green leafy tree at left might be narrower than white glossy boat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e9645d1a76227395.jpg", "conversations": [ { "from": "human", "value": "\nIs dark amber liquid at upper center wider than silver metallic faucet at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, dark amber liquid at upper center is wider than silver metallic faucet at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7be2c3e1985e8d28.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of multicolored fabric jacket at center and multicolored face paint at center in the image provided, where is multicolored fabric jacket at center located with respect to multicolored face paint at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0dd69ce777442db5.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) green mossy rock at center (B) smooth brown log at center (C) smooth bark tree at upper center" }, { "from": "gpt", "value": "(C) smooth bark tree at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d0819d33a7b8e7c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) brown wooden fence at right (B) weathered wood cabin at center (C) green wood tree at center" }, { "from": "gpt", "value": "(B) weathered wood cabin at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f8aee2df155ea45.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) green leafy tree at left (B) white frothy water at center (C) blue water at center (D) green leafy tree at center" }, { "from": "gpt", "value": "(A) green leafy tree at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db08593fb9ee7f31.jpg", "conversations": [ { "from": "human", "value": "\nIs matte gray suit at center above red striped tie at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, matte gray suit at center is not above red striped tie at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e60fd46a7dbeba15.jpg", "conversations": [ { "from": "human", "value": "\nDoes pink wavy hair at center have a larger size compared to pink matte hand at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, pink wavy hair at center has a larger size compared to pink matte hand at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4ab28fb09c7b11c4.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.191, 0.473) (B) (0.502, 0.373)" }, { "from": "gpt", "value": "(B) (0.502, 0.373)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aea19bec19117047.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) blue fabric shirt at lower left (B) checkered shirt at lower right (C) beige cotton shorts at center (D) gray hair at lower right, is positioned farthest from the brown cotton shirt at center?" }, { "from": "gpt", "value": "(D) gray hair at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/15832be4f90e22ca.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) matte white screen at upper right (B) dark suit at right (C) light blue fabric shirt at lower left" }, { "from": "gpt", "value": "(C) light blue fabric shirt at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e30cbfb818d4e1c9.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if ruby glass with spider design at right is positioned to the left of brown fuzzy teddy bear at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, ruby glass with spider design at right is not to the left of brown fuzzy teddy bear at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed6c24859e1b995d.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is red fabric canopy at upper center located relative to matte red blouse at center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc940ab9604ab9d8.jpg", "conversations": [ { "from": "human", "value": "\nDoes cloudy sky at upper center have a lesser width compared to green textured mountain at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, cloudy sky at upper center's width is not less than green textured mountain at upper center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4c32b025ad861e10.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the blue fabric flag at center among (A) white fabric flag at center (B) matte gray suit at left (C) red fabric flag at center (D) white matte projector screen at upper right?" }, { "from": "gpt", "value": "(C) red fabric flag at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/52ce84674b77bad6.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) gold polished trophy at center (B) black plastic pen at lower right (C) shiny dark wood table at center" }, { "from": "gpt", "value": "(A) gold polished trophy at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/28fa051a99b52707.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.327, 0.887) (B) (0.231, 0.653)" }, { "from": "gpt", "value": "(A) (0.327, 0.887)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/42d19de3a11e00c0.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is matte black dog at center located relative to beige fabric cap at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/93fdd56ba4006541.jpg", "conversations": [ { "from": "human", "value": "\nDoes white paper at upper center have a smaller size compared to black paper at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white paper at upper center is not smaller than black paper at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5faad73d31588a39.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of white matte trailer truck at right and neon yellow reflective suit at center in the image provided, where is white matte trailer truck at right located with respect to neon yellow reflective suit at center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0daf51a242e2c94e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if clear glass window at left is bigger than matte brown countertop at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, clear glass window at left is not bigger than matte brown countertop at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7c3ef6b7b079d555.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.593, 0.542) (B) (0.582, 0.573)" }, { "from": "gpt", "value": "(B) (0.582, 0.573)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec509c23637f76cd.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) shiny blue glass skyscraper at upper center (B) translucent glass pod at center" }, { "from": "gpt", "value": "(A) shiny blue glass skyscraper at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0cf2c908bd37ea6a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.288, 0.578) (B) (0.407, 0.500)" }, { "from": "gpt", "value": "(A) (0.288, 0.578)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba4060fded544b02.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white stone building at center is thinner than green stone moat at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white stone building at center is not thinner than green stone moat at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab18821240c99cae.jpg", "conversations": [ { "from": "human", "value": "\nDoes black tactical vest at center come in front of black matte/polished dog at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is in front of black matte/polished dog at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/695760759846a436.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if neon yellow reflective vest at center is smaller than matte black helmet at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/61888bafe7eb8bbe.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of brown textured shorts at center more distant than that of blue denim shorts at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0c363d6234112b41.jpg", "conversations": [ { "from": "human", "value": "\nDoes golden stone tower at center appear on the left side of golden brick building at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, golden stone tower at center is not on the left side of golden brick building at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/379ad4be74dc9c43.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.196, 0.523) (B) (0.249, 0.622) (C) (0.649, 0.452)" }, { "from": "gpt", "value": "(C) (0.649, 0.452)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6bd37c80b91cfd02.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) bronze horse at center (B) bronze muscular figure at center" }, { "from": "gpt", "value": "(B) bronze muscular figure at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f29abb3584792c65.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black matte tank top at center is thinner than black matte hand at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, black matte tank top at center is not thinner than black matte hand at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/98d44f562479854d.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) floral fabric dress at center (B) yellow cotton shirt at center (C) matte green tank top at center (D) green striped shirt at center" }, { "from": "gpt", "value": "(D) green striped shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85d88db051580f57.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) dark brown hair at lower right (B) white heart-patterned shirt at center (C) white paper cup at center" }, { "from": "gpt", "value": "(B) white heart-patterned shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ec2d4a33c9ee954.jpg", "conversations": [ { "from": "human", "value": "\nIs satin gold microwave at center wider than satin stainless steel exhaust hood at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58cfc8fbe4110369.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.306, 0.472) (B) (0.508, 0.328)" }, { "from": "gpt", "value": "(A) (0.306, 0.472)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b43a2b36f4436bc3.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown textured waterfall at center come in front of green leafy trees at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e59f206279b00125.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.318, 0.703) (B) (0.604, 0.811)" }, { "from": "gpt", "value": "(B) (0.604, 0.811)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/103e1b2b72013498.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the purple striped shirt at upper right among (A) smooth black table at center (B) translucent plastic cup at upper right?" }, { "from": "gpt", "value": "(A) smooth black table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/83c031745d200fd2.jpg", "conversations": [ { "from": "human", "value": "\nWhere is gray stone pavement at lower center located in relation to dark gray coat at right in the image? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b276ab634309b43.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) camouflage uniform at left (B) black matte shotgun at center (C) matte black earplugs at left, is positioned closest to the black matte gun at center?" }, { "from": "gpt", "value": "(B) black matte shotgun at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06ad5d07d976ffd0.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) white fabric shirt at lower right (B) dark brown leather jacket at lower center (C) light beige fabric jacket at lower left (D) dark brown leather jacket at lower right" }, { "from": "gpt", "value": "(C) light beige fabric jacket at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4d0e8d30050df4f2.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) gray matte mud at upper right (B) textured fabric hand at upper left" }, { "from": "gpt", "value": "(B) textured fabric hand at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/17456271e85015cb.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue soft baby at center appear under rubberized red apple at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, blue soft baby at center is positioned under rubberized red apple at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/adcdc3675824d4e2.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) smooth concrete stairs at lower right (B) transparent glass window at center" }, { "from": "gpt", "value": "(B) transparent glass window at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f47a80d1efbb8d0.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) green grass football field at center (B) black matte jacket at right" }, { "from": "gpt", "value": "(B) black matte jacket at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04725085c2e2804d.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the yellow tie-dye shirt at center among (A) camouflage fabric shirt at center (B) dark gray hair at center?" }, { "from": "gpt", "value": "(B) dark gray hair at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c35a9c669a283cc.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) smooth sand at lower center (B) black matte jacket at center" }, { "from": "gpt", "value": "(B) black matte jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4fba8a5251c04174.jpg", "conversations": [ { "from": "human", "value": "\nWhere is whiteboard at upper center located in relation to white smooth shirt at upper left in the image? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/17e447d542b0fe9b.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) matte black microphone at center (B) natural wood acoustic guitar at center (C) matte brown guitar at center (D) natural wood acoustic guitar at left" }, { "from": "gpt", "value": "(B) natural wood acoustic guitar at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/45ac3bfdd3048bf2.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of brown dry bush at left in relation to brown dry at center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7779946fc0025fb.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is matte black camera at center located relative to black matte camera at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7647a91ddcfaf12b.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) brown rough tree branch at upper center (B) brown/reflective water at center" }, { "from": "gpt", "value": "(A) brown rough tree branch at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c8930fd673e2611.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if cloudy sky at upper center is positioned to the left of matte gray tower at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, cloudy sky at upper center is to the right of matte gray tower at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc814bf0b34499c4.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) dark gray fabric shirt at left (B) shiny metallic bicycle at lower left" }, { "from": "gpt", "value": "(B) shiny metallic bicycle at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6425afaa4fcbe716.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black matte shorts at center is wider than white matte tank top at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, the width of black matte shorts at center exceeds that of white matte tank top at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bdd49ce50ce808f6.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.478, 0.264) (B) (0.799, 0.147) (C) (0.797, 0.102) (D) (0.385, 0.730)" }, { "from": "gpt", "value": "(D) (0.385, 0.730)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f549cf15646ae44.jpg", "conversations": [ { "from": "human", "value": "\nDoes white cotton shorts at right have a lesser width compared to white cotton t-shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white cotton shorts at right's width is not less than white cotton t-shirt at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/449373db064af77c.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black jacket at center thinner than black matte jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, matte black jacket at center might be wider than black matte jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/93a1ab9e037c04e8.jpg", "conversations": [ { "from": "human", "value": "\nDoes striped shirt at center come in front of striped cotton shirt at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, striped shirt at center is further to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16c52a23c8b464bf.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at center appear on the left side of green leafy tree at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find green leafy tree at center to the left of green leafy tree at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/065f02d785aaa16e.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) brown wooden table at center (B) matte black suit at center, is positioned closest to the green dotted tie at center?" }, { "from": "gpt", "value": "(B) matte black suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca5bba0176bfd5e9.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) gray water at center (B) dark gray fur seal at center" }, { "from": "gpt", "value": "(B) dark gray fur seal at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/14fd81330223fb89.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte blue jacket at center have a lesser width compared to black matte goggles at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, matte blue jacket at center is not thinner than black matte goggles at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3db635babcf76c88.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the jeans at lower center from the following options: (A) white fleece jacket at center (B) pink fleece onesie at lower right (C) brown leather jacket at upper right?" }, { "from": "gpt", "value": "(C) brown leather jacket at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36cb1ac1f443b85e.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.572, 0.772) (B) (0.412, 0.580)" }, { "from": "gpt", "value": "(A) (0.572, 0.772)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c72b47ec56c3040.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green grassy field at lower center is thinner than green leafy tree at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, green grassy field at lower center's width is not less than green leafy tree at lower left's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3ee8d6071b923a87.jpg", "conversations": [ { "from": "human", "value": "\nIs whipped cream with chocolate chips at center positioned in front of white creamy ice cream with colorful candies at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e745160e50ad531.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) white knitted hat at center (B) striped knit scarf at left" }, { "from": "gpt", "value": "(A) white knitted hat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5a7582171557ab4.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the green grassy at lower center? (A) green leafy tree at upper left (B) clear water at center" }, { "from": "gpt", "value": "(B) clear water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a0609acdfbfe87e8.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.170, 0.520) (B) (0.699, 0.330) (C) (0.196, 0.430)" }, { "from": "gpt", "value": "(B) (0.699, 0.330)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1253cb5aa1e3bb2d.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow plastic toy at center positioned behind pink matte toy at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, yellow plastic toy at center is in front of pink matte toy at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9d73900047572f5.jpg", "conversations": [ { "from": "human", "value": "\nDoes denim jacket at center have a lesser width compared to light gray pants at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, denim jacket at center has a lesser width compared to light gray pants at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1196cfc14d232877.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) snow-covered evergreen tree at center (B) wooden bench at lower center (C) smooth bark tree at center" }, { "from": "gpt", "value": "(A) snow-covered evergreen tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8eb12f1ed0c977aa.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of white cotton shirt at center in relation to white fluffy beard at left? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ff6f292c7a5b21a.jpg", "conversations": [ { "from": "human", "value": "\nIs light brown wood boat at left smaller than smooth white boat at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, light brown wood boat at left is smaller than smooth white boat at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba7ced75ec6612eb.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the white waxy candle at center? Select from: (A) floral cotton shirt at center (B) green matte table at center (C) green striped shirt at center" }, { "from": "gpt", "value": "(A) floral cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f21d0ea7a05541e0.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if orange matte face at center is positioned to the right of white t-shirt at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, orange matte face at center is to the right of white t-shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6249e0cb7f77eb77.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of brown matte tree at left in reference to bare branches at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c68a9c270695c69a.jpg", "conversations": [ { "from": "human", "value": "\nIs green grassy mountain range at center above purple matte flower at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/35984f7f76a2fefb.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark gray fabric crowd at center is smaller than dark gray fabric jacket at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ece2978f6aaa63a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green grass at center is smaller than glossy black car at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, green grass at center might be larger than glossy black car at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bdc9ec271dc5c932.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.926, 0.133) (B) (0.402, 0.422)" }, { "from": "gpt", "value": "(A) (0.926, 0.133)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8f46b305fd50aa0.jpg", "conversations": [ { "from": "human", "value": "\nIs bronze statue at center to the left of matte blue dress at left from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, bronze statue at center is to the right of matte blue dress at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f4d12f70cb2d478.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.590, 0.405) (B) (0.831, 0.550) (C) (0.234, 0.386)" }, { "from": "gpt", "value": "(B) (0.831, 0.550)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e322c1cb717e526d.jpg", "conversations": [ { "from": "human", "value": "\nDoes black matte uniform at center have a greater width compared to matte black binoculars at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, black matte uniform at center has a greater width compared to matte black binoculars at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5f79e8f60bbe187e.jpg", "conversations": [ { "from": "human", "value": "\nIs white knitted hat at left wider than white translucent iceberg at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f286f17cc0f38d8.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of matte gray hoodie at center and dark gray hoodie at center in the image provided, where is matte gray hoodie at center located with respect to dark gray hoodie at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ce433f405349c18.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.876, 0.936) (B) (0.219, 0.822) (C) (0.494, 0.558)" }, { "from": "gpt", "value": "(A) (0.876, 0.936)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/72df8def0f90f989.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.776, 0.316) (B) (0.398, 0.536) (C) (0.442, 0.633)" }, { "from": "gpt", "value": "(B) (0.398, 0.536)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/12804296996067ac.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark blue water at center is positioned to the left of metallic gray barge at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, dark blue water at center is not to the left of metallic gray barge at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a6d7464fff61425.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.885, 0.403) (B) (0.932, 0.291) (C) (0.335, 0.703)" }, { "from": "gpt", "value": "(B) (0.932, 0.291)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/56bc8b6ae56560f2.jpg", "conversations": [ { "from": "human", "value": "\nDoes white embroidered shirt at center appear on the right side of black matte jacket at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find white embroidered shirt at center to the right of black matte jacket at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ce1bf56c3269fcd.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the gold ornate dress at center from the following options: (A) black matte shirt at center (B) green satin hijab at center (C) green silk hijab at upper center?" }, { "from": "gpt", "value": "(B) green satin hijab at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4f73f1ca14503f2.jpg", "conversations": [ { "from": "human", "value": "\nDoes satin silver sedan at lower left have a greater width compared to satin silver suv at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, satin silver sedan at lower left is wider than satin silver suv at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/47ac9cae781dcb00.jpg", "conversations": [ { "from": "human", "value": "\nDoes blonde hair at center lie behind matte plastic comb at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b21688cef7c3d571.jpg", "conversations": [ { "from": "human", "value": "\nIs matte brown blouse at center positioned at the back of black matte shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is in front of black matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb1540e20076da72.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if silver metallic car at center is positioned to the left of light blue matte hatchback at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, silver metallic car at center is to the left of light blue matte hatchback at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44ad927401c8354a.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) gray fabric shirt at center (B) blue fabric baseball cap at center" }, { "from": "gpt", "value": "(B) blue fabric baseball cap at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe5b4d8da6eca58c.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at center come behind green leafy tree at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c19d57eebbfc7ff.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.061, 0.639) (B) (0.895, 0.723)" }, { "from": "gpt", "value": "(A) (0.061, 0.639)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4191de8ac64e5370.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if snowy granite mountain range at upper center is positioned below green matte tree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, snowy granite mountain range at upper center is not positioned below green matte tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e497b50614db494.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) striped cotton shirt at center (B) pink cotton shirt at center (C) pink fabric at left, is positioned farthest from the polka dot fabric dress at right?" }, { "from": "gpt", "value": "(C) pink fabric at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b74805c2f2a221fd.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the green stone bridge at center? Choose from: (A) golden stone clock tower at right (B) golden stone tower at left" }, { "from": "gpt", "value": "(A) golden stone clock tower at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/170caa1ff0bee381.jpg", "conversations": [ { "from": "human", "value": "\nIs matte beige lingerie at center smaller than porcelain figurine at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, matte beige lingerie at center is not smaller in size than porcelain figurine at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4761db6d6084227c.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of green grassy at center and green grassy at right in the image provided, where is green grassy at center located with respect to green grassy at right? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16c973b05d5cc1e7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if light gray fabric business suit at left is positioned above light blue silk tie at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, light gray fabric business suit at left is positioned over light blue silk tie at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6671791ae1d1e466.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.384, 0.145) (B) (0.684, 0.334) (C) (0.543, 0.891)" }, { "from": "gpt", "value": "(C) (0.543, 0.891)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a9d5cbe2a267246b.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.479, 0.395) (B) (0.521, 0.677) (C) (0.590, 0.745)" }, { "from": "gpt", "value": "(B) (0.521, 0.677)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6070b20d983c5c0a.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of white sand at lower left more distant than that of red fabric umbrella at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/294cc8269e6c7678.jpg", "conversations": [ { "from": "human", "value": "\nDoes light blue denim jeans at center have a larger size compared to matte white jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, light blue denim jeans at center has a larger size compared to matte white jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b0c9abb78cf15fa.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the camouflage jacket at center? Choose among these: (A) black leather jacket at center (B) brown leather jacket at center" }, { "from": "gpt", "value": "(A) black leather jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f2a5b34b2c2a93c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) wooden polished cello at right (B) matte red shirt at left" }, { "from": "gpt", "value": "(B) matte red shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/674084dd7f9afa09.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown dirt track at lower center appear on the right side of rusty metal hut at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, brown dirt track at lower center is positioned on the right side of rusty metal hut at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de576ac1dc5809af.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black jacket at left appear over matte skin at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, matte black jacket at left is not positioned above matte skin at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d9881c4b6e0da51.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) white matte head at lower center (B) white matte shirt at lower right" }, { "from": "gpt", "value": "(A) white matte head at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c9588905d0d338ba.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) white cotton shirt at upper right (B) black felt cowboy hat at upper center" }, { "from": "gpt", "value": "(B) black felt cowboy hat at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/71d802db6cbca166.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy bush at center-right have a greater width compared to stone tower at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f3bab2eb4a4efb40.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.838, 0.853) (B) (0.891, 0.553)" }, { "from": "gpt", "value": "(A) (0.838, 0.853)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b6c644ea8d35966.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black metal lamp post at left is positioned above metallic silver bench at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, black metal lamp post at left is above metallic silver bench at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb8db3002292e0a4.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown sandy ground at center is smaller than golden fur lion at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, brown sandy ground at center is not smaller than golden fur lion at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f5a909c9a5cfe29.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the smooth skin face at upper right among (A) yellow matte license plate at center (B) metallic yellow license plate at center?" }, { "from": "gpt", "value": "(B) metallic yellow license plate at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a0b7e7ccc760619d.jpg", "conversations": [ { "from": "human", "value": "\nWhere is plaid fabric shirt at center located in relation to white matte helmet at lower right in the image? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b145fa175b814ac8.jpg", "conversations": [ { "from": "human", "value": "\nIs rustic rock canyon at center to the left of light blue fleece at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, rustic rock canyon at center is to the right of light blue fleece at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00f3b4707ac603d1.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.087, 0.019) (B) (0.613, 0.347) (C) (0.686, 0.547) (D) (0.750, 0.883)" }, { "from": "gpt", "value": "(B) (0.613, 0.347)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/22612db45d933eef.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) green spiky cactus at left (B) green spiky cactus at center" }, { "from": "gpt", "value": "(A) green spiky cactus at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4aac02d1f996e3d8.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.046, 0.764) (B) (0.530, 0.637) (C) (0.278, 0.606)" }, { "from": "gpt", "value": "(B) (0.530, 0.637)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b712f0ca2ec68113.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) gray rough boulder at center (B) gray rough rock at lower left (C) green mossy rock at center" }, { "from": "gpt", "value": "(C) green mossy rock at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82ebab3c0a9622fc.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the matte plastic cup at center among (A) black wood table at lower center (B) striped shirt at center (C) gray suit jacket at right (D) dark gray suit at center?" }, { "from": "gpt", "value": "(C) gray suit jacket at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dce3cada72234ace.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.530, 0.744) (B) (0.137, 0.184)" }, { "from": "gpt", "value": "(B) (0.137, 0.184)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d826a6724b2fe98c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) black matte eye at center (B) bubble wrap at center (C) soft fabric hair at right" }, { "from": "gpt", "value": "(C) soft fabric hair at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ebdabbd7b99d179d.jpg", "conversations": [ { "from": "human", "value": "\nIs white fluffy cloud at upper left further to the viewer compared to brown polished column at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/774cde8abbae7b86.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.430, 0.544) (B) (0.133, 0.186)" }, { "from": "gpt", "value": "(A) (0.430, 0.544)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6bfe2614cc4418af.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte refrigerator at right positioned behind white glossy sink at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is in front of white glossy sink at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/25da465423c47c27.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of black matte grill at lower right in reference to bright pink petals at lower center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a9e98f54702e2a1.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of smooth concrete tarmac at center less distant than that of white glossy airplane at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, smooth concrete tarmac at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f2426a68b3f7f142.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) metallic silver microphone at center (B) denim jacket at center" }, { "from": "gpt", "value": "(B) denim jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/57776f6fa53a33d3.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.249, 0.805) (B) (0.266, 0.672) (C) (0.699, 0.670) (D) (0.522, 0.831)" }, { "from": "gpt", "value": "(A) (0.249, 0.805)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d584333ef9b66b30.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.230, 0.623) (B) (0.738, 0.719) (C) (0.745, 0.225)" }, { "from": "gpt", "value": "(B) (0.738, 0.719)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bb32f6fb48ec4b82.jpg", "conversations": [ { "from": "human", "value": "\nDoes light blue checkered shirt at center appear under white shirt at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, light blue checkered shirt at center is located below white shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/970b4cc6af2b89d4.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown wooden track at center have a greater width compared to blue and white striped locomotive at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, brown wooden track at center is wider than blue and white striped locomotive at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88ac8a63ce40d67b.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.498, 0.916) (B) (0.732, 0.486)" }, { "from": "gpt", "value": "(B) (0.732, 0.486)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d041f53f8d8d7bd.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black monitor at upper center have a lesser width compared to matte plastic monitor at center-left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, matte black monitor at upper center is not thinner than matte plastic monitor at center-left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/096df3eac922ba2c.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is white matte shirt at lower right located relative to white cotton shirt at lower center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff6e2091d461acd8.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue water at center have a greater width compared to white plastic boat at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, blue water at center is wider than white plastic boat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/30ccfb6d4601e262.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is clear textured glass jar at center located relative to clear plastic bottle at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c00989381606e80.jpg", "conversations": [ { "from": "human", "value": "\nDoes shiny silver jacket at center have a smaller size compared to matte blue fish at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, shiny silver jacket at center has a smaller size compared to matte blue fish at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4c8da06cb3c0566d.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the white glossy projector screen at center among (A) matte black chair at center (B) floral fabric dress at lower right?" }, { "from": "gpt", "value": "(A) matte black chair at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f116b3b40bab6cab.jpg", "conversations": [ { "from": "human", "value": "\nDoes transparent glass door at left have a greater width compared to light beige pants at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, the width of transparent glass door at left exceeds that of light beige pants at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/080a36af6ac480e6.jpg", "conversations": [ { "from": "human", "value": "\nDoes black matte oven at bottom appear on the left side of shiny silver frying pan at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find black matte oven at bottom to the left of shiny silver frying pan at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/169ef6c718e87fa0.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark blue jeans at center appear under matte beige backpack at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, dark blue jeans at center is below matte beige backpack at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f9b55ac593c227d3.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) black glossy smartphone at center (B) matte glass screen at center" }, { "from": "gpt", "value": "(B) matte glass screen at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7aece1ee25a30cbf.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) black plastic sign at upper center (B) white plastic sign at lower center (C) white cotton shirt at center (D) matte white sunglasses at center" }, { "from": "gpt", "value": "(A) black plastic sign at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9980f651dbb2f03e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the green fabric at center? Select from: (A) white woolen coat at center (B) blue linen tunic at center" }, { "from": "gpt", "value": "(A) white woolen coat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6fbf7e05dd385635.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark gray suit at center is positioned to the right of satin gold jacket at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find dark gray suit at center to the right of satin gold jacket at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fd605782859b5e1f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.672, 0.497) (B) (0.240, 0.489) (C) (0.213, 0.498)" }, { "from": "gpt", "value": "(A) (0.672, 0.497)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/52f3e27cfa0aabe5.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black leather jacket at center is positioned below dark brown leather jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3213d4ef0fbd01e8.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.277, 0.320) (B) (0.782, 0.719)" }, { "from": "gpt", "value": "(B) (0.782, 0.719)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a119b802fc97216.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.106, 0.997) (B) (0.621, 0.841)" }, { "from": "gpt", "value": "(B) (0.621, 0.841)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3723a4065778363c.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of green grassy hill at upper center less distant than that of brown dusty road at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fa680aa2897fba0c.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the gold shiny trombone at right? (A) gold shiny trumpet at right (B) gold shiny trumpet at left" }, { "from": "gpt", "value": "(B) gold shiny trumpet at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b761789f00388a1a.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black shirt at center lie behind red printed dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/808fa2708fb1601a.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny metallic pants at center to the right of white matte tank top at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, shiny metallic pants at center is not to the right of white matte tank top at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d97c4e2e1f004951.jpg", "conversations": [ { "from": "human", "value": "\nIs green rough textured tree at center further to camera compared to metallic silver ladder at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7801a0630338d37b.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy hedge at lower right have a greater width compared to shiny metallic bicycle at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5ebabc8b56de467b.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.850, 0.342) (B) (0.402, 0.562)" }, { "from": "gpt", "value": "(A) (0.850, 0.342)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01c711407f5e4fbc.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if red matte signboard at center is positioned to the left of white painted signboard at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, red matte signboard at center is to the left of white painted signboard at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a44d8e32255ac9b.jpg", "conversations": [ { "from": "human", "value": "\nDoes black matte shirt at center appear over blue fabric shirt at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a6cde0d451df230d.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) green grass at center (B) yellow striped spider at center" }, { "from": "gpt", "value": "(B) yellow striped spider at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/38820dfd84737c3b.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) matte gray jeans at left (B) purple matte shirt at upper right (C) smooth sand at lower center" }, { "from": "gpt", "value": "(B) purple matte shirt at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/940ef0f28fd19d8c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the metallic silver laptop at center? Choose among these: (A) pink matte shirt at center (B) black plastic speaker at lower center (C) blue fabric table at center" }, { "from": "gpt", "value": "(A) pink matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2794fe7a05837f3c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.275, 0.647) (B) (0.899, 0.816)" }, { "from": "gpt", "value": "(A) (0.275, 0.647)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aa0feec8f2e76498.jpg", "conversations": [ { "from": "human", "value": "\nIs brown polished wood table at center smaller than black plastic microphone at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, brown polished wood table at center is not smaller in size than black plastic microphone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/171affba3b2c47cf.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.189, 0.009) (B) (0.676, 0.637) (C) (0.444, 0.794)" }, { "from": "gpt", "value": "(A) (0.189, 0.009)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0103a1ad61cf2c04.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the illuminated plastic tree at right? Choose from: (A) illuminated plastic tree at center (B) illuminated white tree at center" }, { "from": "gpt", "value": "(A) illuminated plastic tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e6dd1851733aac29.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the dark suit at center? (A) purple silk tie at center (B) brown fabric table at center" }, { "from": "gpt", "value": "(B) brown fabric table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e4465b35905a5872.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) blue fabric jacket at center (B) green fabric jacket at center (C) jeans at center" }, { "from": "gpt", "value": "(B) green fabric jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c9f7aac9a82cac6.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy plant at center appear on the right side of green leafy plant at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, green leafy plant at center is to the right of green leafy plant at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/28f60dd68de76468.jpg", "conversations": [ { "from": "human", "value": "\nDoes yellow uniform shirt at center have a larger size compared to yellow fabric cap at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, yellow uniform shirt at center is larger in size than yellow fabric cap at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/99e4e3be30e05325.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) matte black pencil at center (B) green matte exercise book at center" }, { "from": "gpt", "value": "(A) matte black pencil at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8ef6c758a7c47d7.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) matte black bed at center (B) black cotton shirt at left (C) matte black jacket at center" }, { "from": "gpt", "value": "(B) black cotton shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/14b7808b89f1cc46.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if sandy yellow at lower left is positioned below green leafy palm tree at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, sandy yellow at lower left is located below green leafy palm tree at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1cece85d42879f83.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy trees at center appear on the right side of green matte tree at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, green leafy trees at center is to the left of green matte tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2706dab4c26f78cb.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of black metallic sedan at center more distant than that of white plastic license plate at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e575f37d0f336e4.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.500, 0.497) (B) (0.534, 0.717)" }, { "from": "gpt", "value": "(B) (0.534, 0.717)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/18ec1e8e56b23fab.jpg", "conversations": [ { "from": "human", "value": "\nWhere is blue fabric face at center located in relation to white glossy car at upper right in the image? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/40dff8a67e501686.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) red matte baseball cap at center (B) blue fabric baseball cap at center (C) blue fabric cap at center (D) blue fabric hoodie at center" }, { "from": "gpt", "value": "(A) red matte baseball cap at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d6523a4cce05206.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if smooth steel tracks at center is bigger than brown wooden passenger train at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, smooth steel tracks at center is not bigger than brown wooden passenger train at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04f9b9f9366c8231.jpg", "conversations": [ { "from": "human", "value": "\nDoes white paper sign at center have a larger size compared to white paper at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d5cc9d8df2edc7ea.jpg", "conversations": [ { "from": "human", "value": "\nDoes shiny blue shorts at center come in front of blue shirt at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, shiny blue shorts at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8861b25dcde49383.jpg", "conversations": [ { "from": "human", "value": "\nIs skinny white hand at center above dark brown fuzzy beard at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, skinny white hand at center is not above dark brown fuzzy beard at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d0aceca378c1fa5.jpg", "conversations": [ { "from": "human", "value": "\nDoes glistening water at center have a smaller size compared to black matte dress at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a1bc88e52005fbf5.jpg", "conversations": [ { "from": "human", "value": "\nIs brown suede shirt at left bigger than blue dotted tie at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ef804c23d86493e.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of green mossy tree at center in relation to golden brown feathered rooster at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/83045c89542cb849.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of white/red painted coach at upper left in reference to metallic red dalek at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3de43a26387318ca.jpg", "conversations": [ { "from": "human", "value": "\nDoes striped sweater at left have a larger size compared to plaid fabric shirt at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d7ee96292b4718f0.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if beige stone palace at center is wider than black metal rail at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of beige stone palace at center exceeds that of black metal rail at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9eb719beaefc2276.jpg", "conversations": [ { "from": "human", "value": "\nDoes smooth bark tree trunk at center have a larger size compared to brown suede vest at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, smooth bark tree trunk at center is not bigger than brown suede vest at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/214a7724f1f4f93e.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of blue fabric shirt at center and black metal fence at lower center in the image provided, where is blue fabric shirt at center located with respect to black metal fence at lower center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f6eac9ea5f7f8422.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) black fabric curtain at center (B) matte black monitor at center" }, { "from": "gpt", "value": "(B) matte black monitor at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/18e1ad45d6a4545e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) dark brown wooden cello at center (B) matte black blazer at left" }, { "from": "gpt", "value": "(B) matte black blazer at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5f7522c3540c89ec.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if shiny brown fur at center is smaller than spotted fur dog at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, shiny brown fur at center is smaller than spotted fur dog at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/412de5cc5aa139f9.jpg", "conversations": [ { "from": "human", "value": "\nIs orange satin dress at right further to camera compared to purple matte shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4d041cfbe9bd053a.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of black fleece jacket at center in reference to matte red jacket at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7653679a07f465f7.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte shirt at center appear on the right side of white striped birthday candle at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, white matte shirt at center is not on the right side of white striped birthday candle at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/712f10c13d8a8bd4.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) matte gray backpack at center (B) black plastic sunglasses at upper left" }, { "from": "gpt", "value": "(B) black plastic sunglasses at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aca6912c090f7392.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.871, 0.528) (B) (0.652, 0.644) (C) (0.549, 0.947)" }, { "from": "gpt", "value": "(A) (0.871, 0.528)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d16053425fcf9c6.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte brown hair at center have a greater width compared to matte black glasses at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, matte brown hair at center might be narrower than matte black glasses at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c15bd67b0e901202.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) black fluffy dog at center (B) white fluffy dog at center" }, { "from": "gpt", "value": "(A) black fluffy dog at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d4ff99c33da37bdc.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of dark blue suit at center more distant than that of matte black microphone at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, dark blue suit at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dbb5f806bba48432.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is smooth asphalt highway at lower center located relative to yellow plastic sign at lower right? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f0d46f8f764143b2.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.564, 0.333) (B) (0.040, 0.427)" }, { "from": "gpt", "value": "(A) (0.564, 0.333)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c486192595fb49a.jpg", "conversations": [ { "from": "human", "value": "\nIs white feathered bird at center below matte brown bird at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, white feathered bird at center is located below matte brown bird at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/946cf6f040bba444.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.706, 0.964) (B) (0.450, 0.534) (C) (0.527, 0.834)" }, { "from": "gpt", "value": "(A) (0.706, 0.964)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e015929fb0e2fc9.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) brown woolen sheep at center (B) white woolen lamb at center" }, { "from": "gpt", "value": "(B) white woolen lamb at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1df6e24490974c65.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the denim pants at lower right? (A) purple cotton pants at center (B) spray paint sign at center (C) white fabric at center" }, { "from": "gpt", "value": "(C) white fabric at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5567b6cf713d56c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.620, 0.505) (B) (0.563, 0.581) (C) (0.132, 0.633) (D) (0.130, 0.364)" }, { "from": "gpt", "value": "(A) (0.620, 0.505)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d609d7ced8e15a5e.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the blue fleece blanket at center? (A) transparent glass window at upper center (B) gray fluffy cat at center" }, { "from": "gpt", "value": "(B) gray fluffy cat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b669d50e85413f11.jpg", "conversations": [ { "from": "human", "value": "\nDoes green grass at lower center appear on the right side of orange striped tiger at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green grass at lower center is positioned on the right side of orange striped tiger at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/93324f0507b829f1.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte white t-shirt at upper center appear on the left side of striped shirt at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte white t-shirt at upper center is to the left of striped shirt at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a33bf7da37672b1.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the brown fur at lower left? (A) brown textured wood at center (B) brown feathered falcon at center" }, { "from": "gpt", "value": "(A) brown textured wood at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f11216f46ff4262.jpg", "conversations": [ { "from": "human", "value": "\nIs light beige sweater at center to the right of floral fabric dress at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, light beige sweater at center is not on the right side of floral fabric dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb362a26b93b7225.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.932, 0.745) (B) (0.869, 0.533) (C) (0.537, 0.795) (D) (0.693, 0.819)" }, { "from": "gpt", "value": "(B) (0.869, 0.533)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/503dca8aa3e6d678.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.927, 0.952) (B) (0.755, 0.536) (C) (0.455, 0.483)" }, { "from": "gpt", "value": "(B) (0.755, 0.536)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f5462043ce89254.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the matte black handgun at center? Choose among these: (A) brown leather jacket at center (B) matte red jacket at upper left" }, { "from": "gpt", "value": "(B) matte red jacket at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff1ff854ea936591.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) brown bark tree at right (B) brown bark tree at left" }, { "from": "gpt", "value": "(A) brown bark tree at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/988b620932fee559.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) dark gray t-shirt at left (B) tan cotton shirt at center (C) gray cotton t-shirt at center (D) teal striped polo shirt at center" }, { "from": "gpt", "value": "(A) dark gray t-shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7fd946568e0205db.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) shiny blue car at left (B) red shirt at center" }, { "from": "gpt", "value": "(A) shiny blue car at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f75e3c76ce6d1f4.jpg", "conversations": [ { "from": "human", "value": "\nIs brown textured suit at center in front of black textured shirt at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, brown textured suit at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/68ff5e372d9845ac.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte striped shirt at center appear over dark gray metal eiffel tower at right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e49f5b31bb295b6.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the matte black car at left? Choose among these: (A) glossy black sedan at center (B) matte black car at center (C) black plastic license plate at center" }, { "from": "gpt", "value": "(A) glossy black sedan at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01a49b6659c455c3.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) white glossy airplane tail at right (B) red matte ship at center (C) white matte tugboat at center" }, { "from": "gpt", "value": "(A) white glossy airplane tail at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1f3baa5cc4f0b37.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white paper banner at center is smaller than white paper sign at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b19ed4cae364f475.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown leafy tree at center is bigger than yellow-green foliage at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, brown leafy tree at center is larger in size than yellow-green foliage at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c0c78e27eb955f92.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if wooden table at center is positioned above black glossy router at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, wooden table at center is below black glossy router at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85752a683e787058.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the white plastic sign at upper center? Choose among these: (A) white stone sculpture at upper left (B) white stone angel at center" }, { "from": "gpt", "value": "(A) white stone sculpture at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82d976e8871ead16.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) yellow metallic excavator at left (B) white fabric fence at center, is positioned closest to the orange fabric at center?" }, { "from": "gpt", "value": "(B) white fabric fence at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a75de17e7bde2506.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of gray sweater at center and blue fabric bean bag at center in the image provided, where is gray sweater at center located with respect to blue fabric bean bag at center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88fa36f4d842d54d.jpg", "conversations": [ { "from": "human", "value": "\nDoes yellow synthetic leather glove at center appear over yellow leather boxing glove at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, yellow synthetic leather glove at center is below yellow leather boxing glove at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d09149be7f7d95ba.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.312, 0.688) (B) (0.880, 0.175)" }, { "from": "gpt", "value": "(B) (0.880, 0.175)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4b50a07107e0939.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the brown leather jacket at upper right? Select from: (A) yellow matte orange at center (B) matte black sweater at center (C) translucent plastic container at lower left" }, { "from": "gpt", "value": "(C) translucent plastic container at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c20a300f933b458.jpg", "conversations": [ { "from": "human", "value": "\nIs white cotton sweater at center above green scarf at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, white cotton sweater at center is positioned over green scarf at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db0cf1d0942be644.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.257, 0.713) (B) (0.145, 0.997)" }, { "from": "gpt", "value": "(A) (0.257, 0.713)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e8bfe51122ca081.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.363, 0.764) (B) (0.491, 0.727)" }, { "from": "gpt", "value": "(B) (0.491, 0.727)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f105a53e5cfae611.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of teal fabric shorts at center less distant than that of matte white shirt at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, teal fabric shorts at center is in front of matte white shirt at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3ea5a313c612f3da.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) pink matte flower at center (B) green matte tree at center (C) green leafy tree at center" }, { "from": "gpt", "value": "(C) green leafy tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/50ad5a10c5ce8c47.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.154, 0.978) (B) (0.457, 0.694) (C) (0.384, 0.259) (D) (0.512, 0.202)" }, { "from": "gpt", "value": "(A) (0.154, 0.978)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/916433991fae2e57.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) transparent water at lower right (B) green leafy tree at center (C) gray volcanic rock mountain at center" }, { "from": "gpt", "value": "(A) transparent water at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b146e220acd5c9d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black coat at center is thinner than knitted wool sweater at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, matte black coat at center is not thinner than knitted wool sweater at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1265ee6844e9c5d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.382, 0.344) (B) (0.213, 0.561)" }, { "from": "gpt", "value": "(B) (0.213, 0.561)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/25b50ea43603a3f7.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.518, 0.494) (B) (0.182, 0.448)" }, { "from": "gpt", "value": "(A) (0.518, 0.494)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4bc963d1df8a1dba.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) dark brown textured food at center (B) smooth skin man at center (C) smooth brown nuts at lower right (D) smooth brown rice at lower right" }, { "from": "gpt", "value": "(B) smooth skin man at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e08d99c1c5026644.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) blue striped shirt at center (B) black fabric headscarf at center" }, { "from": "gpt", "value": "(B) black fabric headscarf at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cae37f8f4ad52c07.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.448, 0.333) (B) (0.266, 0.983)" }, { "from": "gpt", "value": "(B) (0.266, 0.983)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd6be234ea820631.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of translucent fabric at center more distant than that of brown textured fabric at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc06932681ced459.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.370, 0.609) (B) (0.055, 0.439)" }, { "from": "gpt", "value": "(A) (0.370, 0.609)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/886d1793b0f1a2dd.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black backpack at center appear on the right side of denim jeans at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte black backpack at center is to the right of denim jeans at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/598437ab10da55e0.jpg", "conversations": [ { "from": "human", "value": "\nDoes transparent glass door at left have a larger size compared to yellow plastic sander at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, transparent glass door at left is bigger than yellow plastic sander at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d282fd12f036062c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) metallic bridge at center (B) white glossy ferry at center (C) metallic gray crane at left" }, { "from": "gpt", "value": "(A) metallic bridge at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/170a5d24c2c637f1.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow metallic train at center positioned in front of smooth skin face at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eef7f92040a6381f.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the blue jacket at center? Choose from: (A) red fleece jacket at lower left (B) red fleece jackets at lower center" }, { "from": "gpt", "value": "(A) red fleece jacket at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d55f0a129c81cceb.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue water at center appear under white matte sailboat at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, blue water at center is positioned under white matte sailboat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6180a8b00d607f0b.jpg", "conversations": [ { "from": "human", "value": "\nIs green fabric backpack at upper left positioned in front of yellow fabric backpack at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, green fabric backpack at upper left is in front of yellow fabric backpack at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a62c94cc147575dc.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) green ivy-covered wall at center (B) green leafy tree at center (C) wooden park bench at lower left (D) camouflage fabric jacket at lower left" }, { "from": "gpt", "value": "(A) green ivy-covered wall at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b201c5fef3126f2.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.393, 0.750) (B) (0.771, 0.255) (C) (0.830, 0.181)" }, { "from": "gpt", "value": "(A) (0.393, 0.750)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7d8d5ba30ae46c0.jpg", "conversations": [ { "from": "human", "value": "\nDoes teal glossy hair at center appear on the right side of yellow matte mashed potato at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find teal glossy hair at center to the right of yellow matte mashed potato at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/597c34be5bb19dff.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of black lace baby carriage at center in reference to velvet black dress at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/917abae1b563b6bb.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.331, 0.842) (B) (0.356, 0.689)" }, { "from": "gpt", "value": "(A) (0.331, 0.842)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ba72df7c495512d.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the white cardboard sign at center? Choose from: (A) matte black hair at lower right (B) white cardboard sign at upper center (C) matte black tank top at upper left (D) matte white sign at center" }, { "from": "gpt", "value": "(D) matte white sign at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef2b4cc9b00701e9.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the pink matte flower at upper right? Choose among these: (A) green stone path at center (B) brown textured hay at center (C) yellow matte flower at upper left (D) green leafy vegetation at upper center" }, { "from": "gpt", "value": "(B) brown textured hay at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5bae94ffe12cc519.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) metallic woven fabric chair at right (B) black plastic picnic table at center (C) matte plastic plate at center" }, { "from": "gpt", "value": "(B) black plastic picnic table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c9e9de05cd83aa64.jpg", "conversations": [ { "from": "human", "value": "\nIs black wire mesh fence at lower right above green matte shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, black wire mesh fence at lower right is below green matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7620c9da9450d39.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.947, 0.431) (B) (0.476, 0.506) (C) (0.383, 0.989) (D) (0.731, 0.467)" }, { "from": "gpt", "value": "(D) (0.731, 0.467)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00342dbcfa931395.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the matte black vest at center? Select from: (A) white fabric at upper right (B) satin dress at center" }, { "from": "gpt", "value": "(B) satin dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/986a9a0572cb1072.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of white matte snow at center and white glossy helicopter at upper center in the image provided, where is white matte snow at center located with respect to white glossy helicopter at upper center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8ef23f69ab834666.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) white glossy fish at center (B) speckled orange fish at upper left (C) yellow shiny fish at center" }, { "from": "gpt", "value": "(C) yellow shiny fish at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d40878057c543d65.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) vivid orange maple leaf at center (B) wooden picket fence at lower center" }, { "from": "gpt", "value": "(B) wooden picket fence at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf42f90680e52724.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) black t-shirt at center (B) black matte microphone at left" }, { "from": "gpt", "value": "(A) black t-shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a6b2c1b250b47c8d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.380, 0.594) (B) (0.546, 0.659)" }, { "from": "gpt", "value": "(A) (0.380, 0.594)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ede463c4aa866dc5.jpg", "conversations": [ { "from": "human", "value": "\nDoes gold/gilded spire at upper center come behind gold/gilded spire at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, gold/gilded spire at upper center is behind gold/gilded spire at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/43de35d1ca18af15.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) bare white tree at center (B) white powdery snow at center" }, { "from": "gpt", "value": "(A) bare white tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d464d0921dabe00.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the polka dot fabric blouse at center? Choose among these: (A) denim jacket at center (B) matte black jacket at center" }, { "from": "gpt", "value": "(A) denim jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/337a52f370c59bfc.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the green grass at center? Choose from: (A) brownhair at center (B) matte skin at center (C) matte skin hand at center (D) lace beige bodysuit at center" }, { "from": "gpt", "value": "(D) lace beige bodysuit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4346a6d24b0f44cf.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) white matte shirt at upper center (B) pink matte shirt at center" }, { "from": "gpt", "value": "(B) pink matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/886b67f20f9bcb6d.jpg", "conversations": [ { "from": "human", "value": "\nIs white misty cloud at upper center above white fluffy cloud at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2db642584170b6c7.jpg", "conversations": [ { "from": "human", "value": "\nIs transparent water at center in front of yellow matte kayak at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1deee406564788f3.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if orange cotton t-shirt at left is smaller than black smooth polo shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ab9b8daf871e14b.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark gray cotton t-shirt at center come in front of light pink fabric at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, dark gray cotton t-shirt at center is further to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/26e5578bdb96ea92.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black fabric jacket at upper right is positioned above satin khaki shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, black fabric jacket at upper right is above satin khaki shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c319a62f4c74a676.jpg", "conversations": [ { "from": "human", "value": "\nDoes green sheer dress at center lie behind camouflage fabric shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ddc685d7773eda5d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.925, 0.911) (B) (0.904, 0.627) (C) (0.645, 0.477)" }, { "from": "gpt", "value": "(C) (0.645, 0.477)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/612d6b55b8415ff5.jpg", "conversations": [ { "from": "human", "value": "\nDoes black dotted dress at center come in front of black matte dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e5598c98b280c078.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.468, 0.867) (B) (0.448, 0.619)" }, { "from": "gpt", "value": "(A) (0.468, 0.867)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/670cd89ac72c225e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the dark blue blazer at center? Choose among these: (A) smooth blonde hair at upper center (B) patterned scarf at upper left (C) green denim vest at center" }, { "from": "gpt", "value": "(C) green denim vest at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e4bf242fa1983b9c.jpg", "conversations": [ { "from": "human", "value": "\nIs brown gravel train track at center in front of metallic brown train at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, brown gravel train track at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c23301ec754d6c74.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.480, 0.684) (B) (0.451, 0.334)" }, { "from": "gpt", "value": "(B) (0.451, 0.334)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e52fcc28a8882ac9.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the gray cotton shirt at upper right from the following options: (A) silver metallic laptop at left (B) blue cotton shirt at center (C) blue shirt at center?" }, { "from": "gpt", "value": "(B) blue cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/99cdb6fc0df3a8e4.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) yellow matte license plate at center (B) white matte van at left (C) yellow matte license plate at rear (D) silver metallic van at center" }, { "from": "gpt", "value": "(D) silver metallic van at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/adb8d2316d32ae47.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) multicolored knitted pillow at center (B) black leather swivel chair at center" }, { "from": "gpt", "value": "(A) multicolored knitted pillow at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86d861807adbabf3.jpg", "conversations": [ { "from": "human", "value": "\nIs glistening water at lower center bigger than dark clothing figure at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3f15717cfaa941f5.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the brown glass bottle at center among (A) matte glass bottle at right (B) brown glass bottle at left?" }, { "from": "gpt", "value": "(A) matte glass bottle at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4d5867ca43f3a332.jpg", "conversations": [ { "from": "human", "value": "\nIs matte white shirt at center positioned before blue fabric shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte white shirt at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cde9342ea8b8e530.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.226, 0.681) (B) (0.878, 0.514)" }, { "from": "gpt", "value": "(A) (0.226, 0.681)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5ae34705b23573de.jpg", "conversations": [ { "from": "human", "value": "\nDoes rustic stone church at center appear under blue water at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, rustic stone church at center is above blue water at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8326b447ab28e781.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) dark brown sweater at center (B) dark gray ribbed sweater at center" }, { "from": "gpt", "value": "(B) dark gray ribbed sweater at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d075ffd284c8f4d4.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the green leafy palm tree at left? Choose from: (A) yellow matte school bus at center (B) brown dirt track at lower left (C) green leafy palm tree at upper right (D) metallic silver motorbike at lower left" }, { "from": "gpt", "value": "(B) brown dirt track at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/32d0a7b1ef99d92a.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the purple satin blouse at center? (A) concrete stairs at lower left (B) black matte shirt at center" }, { "from": "gpt", "value": "(A) concrete stairs at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e697216eff31ee8.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) black matte dress at right (B) plaid skirt at center" }, { "from": "gpt", "value": "(A) black matte dress at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/053e02f71915aca1.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if smooth rock mountain at center is wider than fuzzy white cloud at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, smooth rock mountain at center has a greater width compared to fuzzy white cloud at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fdc12d4b8432b532.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) red and white fabric flag at upper center (B) polished stone tower at upper center" }, { "from": "gpt", "value": "(B) polished stone tower at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a6f9c05d0a857b3.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at center positioned before white matte van at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, green leafy tree at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01fe7e3547d7f7dc.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of brown matte minifigure at lower left in reference to black plastic minifigure at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f6c485ee5d18d3a6.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) light brown hair at lower center (B) matte blue shirt at center" }, { "from": "gpt", "value": "(B) matte blue shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/40a3689e191701ae.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) white cardboard cabin at center (B) dark green matte suv at left" }, { "from": "gpt", "value": "(B) dark green matte suv at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/67fbc9e00e324503.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of white plastic table at lower right and matte black tank top at center in the image provided, where is white plastic table at lower right located with respect to matte black tank top at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/79c67b26d8e6d726.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the white cotton shirt at center? (A) matte white blouse at center (B) white cotton dress at center (C) silver metallic van at center (D) white smooth pavement at center" }, { "from": "gpt", "value": "(C) silver metallic van at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82c7a7613236cbb8.jpg", "conversations": [ { "from": "human", "value": "\nIs beige fabric armchair at center to the right of matte white lampshade at upper center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, beige fabric armchair at center is not on the right side of matte white lampshade at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/14a99312a43a74f8.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) brown wood tree at upper center (B) green striped shirt at center (C) light brown leather jacket at center (D) brown matte shirt at center" }, { "from": "gpt", "value": "(A) brown wood tree at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ba363b1653c94c9.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) green leafy tree at center (B) brown wooden picnic table at center (C) green leafy palm at left, is positioned closest to the white matte/hardobject at center-right?" }, { "from": "gpt", "value": "(A) green leafy tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fd6fe2fd157c1047.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green grass at lower center located in relation to green textured tree at center in the image? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe8c29d21371c696.jpg", "conversations": [ { "from": "human", "value": "\nIs black silk suit at center bigger than maroon velvet robe at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/94b981af8956ad43.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.386, 0.886) (B) (0.774, 0.947) (C) (0.275, 0.475) (D) (0.227, 0.786)" }, { "from": "gpt", "value": "(B) (0.774, 0.947)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4191f773b82498c0.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.256, 0.533) (B) (0.688, 0.080)" }, { "from": "gpt", "value": "(A) (0.256, 0.533)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ebf42b6b918f02d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.386, 0.522) (B) (0.456, 0.839)" }, { "from": "gpt", "value": "(B) (0.456, 0.839)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c1ae7a626ec4e6c.jpg", "conversations": [ { "from": "human", "value": "\nIs matte wood cabin at center to the left of white wooden rail at lower right from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte wood cabin at center is to the left of white wooden rail at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d614b7f68ee3d72.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth metal tracks at center wider than yellow matte train at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a98765a716190cfd.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown water at upper left have a larger size compared to white glass building at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, brown water at upper left has a larger size compared to white glass building at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/65fbacbdec954e11.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) gray stone tower at center (B) smooth glass tower at upper right" }, { "from": "gpt", "value": "(B) smooth glass tower at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/890de8bf702d0594.jpg", "conversations": [ { "from": "human", "value": "\nIs green forested mountain at center closer to the viewer compared to shiny black cruise ship at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, green forested mountain at center is further to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/225b72196441e4db.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) black fabric street vendor at center (B) transparent plastic umbrella at upper left (C) light gray cotton shorts at center" }, { "from": "gpt", "value": "(C) light gray cotton shorts at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/61d8e6bd9764269f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.736, 0.689) (B) (0.420, 0.498)" }, { "from": "gpt", "value": "(A) (0.736, 0.689)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0317925567eddaa3.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) green leafy tree at center (B) green grassy at lower left" }, { "from": "gpt", "value": "(A) green leafy tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bb8f2eb96011848e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the wooden table at center? Choose among these: (A) matte black bottle at left (B) green glass bottle at center" }, { "from": "gpt", "value": "(B) green glass bottle at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6dad6498c4b4d518.jpg", "conversations": [ { "from": "human", "value": "\nIs white cotton shirt at lower right wider than beige shorts at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, white cotton shirt at lower right is wider than beige shorts at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ac267b1b18c5343.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.763, 0.847) (B) (0.622, 0.189) (C) (0.732, 0.523) (D) (0.354, 0.975)" }, { "from": "gpt", "value": "(B) (0.622, 0.189)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/72f7256e1d2e5d7e.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the floral-patterned shirt at left? (A) wooden podium at center (B) matte white screen at upper center" }, { "from": "gpt", "value": "(B) matte white screen at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3653e5b5bfce58a0.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte blue shirt at center have a lesser width compared to dark blue fleece vest at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, matte blue shirt at center is not thinner than dark blue fleece vest at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e179123d4e5e9f90.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte white t-shirt at left appear under wooden electric guitar at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, matte white t-shirt at left is not positioned below wooden electric guitar at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c032ac6e6c56580.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown curly fur dog at left is wider than black fluffy dog at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of brown curly fur dog at left exceeds that of black fluffy dog at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc9c9cf09d03e1c9.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white glossy ipod at center is positioned below black plastic nokia phone at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, white glossy ipod at center is above black plastic nokia phone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a23dff02975fb14e.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is woven bamboo boat at center located relative to green rough bark tree at upper left? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f461fc8edaabe84e.jpg", "conversations": [ { "from": "human", "value": "\nDoes orange flame helmet at center appear on the left side of dark brown uniform at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, orange flame helmet at center is to the right of dark brown uniform at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/50c149d13cdf4ec1.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) brown rough skin at center (B) wooden canoe at center (C) smooth water at center" }, { "from": "gpt", "value": "(A) brown rough skin at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6cd009117a1e117e.jpg", "conversations": [ { "from": "human", "value": "\nIs camo fabric hoodie at center below brushed metal jacket at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c35c68de2e49890.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) white spotted cow at lower left (B) black and white spotted cow at center (C) wire at center" }, { "from": "gpt", "value": "(A) white spotted cow at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49a48bdd07c65302.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the yellow textured paper at center? Choose from: (A) matte red fabric at center (B) orange woven fabric at center (C) metallic hexagonal prism at upper center" }, { "from": "gpt", "value": "(B) orange woven fabric at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ecf467179ca5e2bf.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.786, 0.833) (B) (0.345, 0.244)" }, { "from": "gpt", "value": "(A) (0.786, 0.833)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dbfa3e5ff0f217a3.jpg", "conversations": [ { "from": "human", "value": "\nIs white textured bark at center positioned in front of brown rough bark at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/021df1b06b3dedc3.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) glassy reflective building at right (B) transparent glass skyscraper at center" }, { "from": "gpt", "value": "(A) glassy reflective building at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c1137b37e0e06f79.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray concrete at bottom is wider than green leafy plant at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, gray concrete at bottom is wider than green leafy plant at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b56063d0fb15138.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black wood table at center is thinner than black silk kimono at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00609ac7507e641e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) brown feathered duck at center (B) brown matte duck at center" }, { "from": "gpt", "value": "(A) brown feathered duck at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0dfde4eabda89188.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass at center behind shiny black chicken at right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, green grass at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c5197b80b09b5c5.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black shirt at right below white cotton shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, matte black shirt at right is not below white cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7de5d0ea4170902f.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.589, 0.570) (B) (0.939, 0.483)" }, { "from": "gpt", "value": "(A) (0.589, 0.570)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7d6a8c72d20c4772.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.696, 0.863) (B) (0.780, 0.709) (C) (0.323, 0.520)" }, { "from": "gpt", "value": "(B) (0.780, 0.709)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5879bbb300d5a80a.jpg", "conversations": [ { "from": "human", "value": "\nDoes camouflage fabric soldier at lower right lie behind camouflage fabric uniform at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is in front of camouflage fabric uniform at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6578a580a930466b.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.817, 0.377) (B) (0.308, 0.570)" }, { "from": "gpt", "value": "(A) (0.817, 0.377)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4563fce9d74fd55c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.336, 0.595) (B) (0.474, 0.637)" }, { "from": "gpt", "value": "(A) (0.336, 0.595)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/52aac294e5735d5f.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of green grassy at lower left less distant than that of brown sand at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/244f477982687757.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) matte orange-roofed houses at center (B) matte pink cloud at upper center" }, { "from": "gpt", "value": "(B) matte pink cloud at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d4b90732a7bd70a6.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) shiny black tank at upper right (B) white plastic tank at center" }, { "from": "gpt", "value": "(A) shiny black tank at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3fdd043b3785184e.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of brown carved wood archway at center in reference to brown leather chair at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/79d5427c2e28f521.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the dark brown rock at center? Select from: (A) gray rough rock at center (B) smooth skin boy at center" }, { "from": "gpt", "value": "(A) gray rough rock at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/701949eeada3cf2e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue fabric shirt at lower left is positioned to the left of black matte speaker at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find blue fabric shirt at lower left to the left of black matte speaker at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f795f5cfcb54b3ce.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white checkered fabric mask at right is positioned to the right of smooth skin face at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, white checkered fabric mask at right is to the right of smooth skin face at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4c21e826c735d92.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark brown leather jacket at center lie behind dark blue hoodie at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8fefa18fba72846a.jpg", "conversations": [ { "from": "human", "value": "\nDoes smooth bark tree at center have a smaller size compared to smooth sand at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/32164c537fd0817a.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.097, 0.959) (B) (0.366, 0.714) (C) (0.510, 0.355) (D) (0.581, 0.572)" }, { "from": "gpt", "value": "(A) (0.097, 0.959)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/130d34e0be9a7564.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown muddy water at lower center lie behind green leafy palm tree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is in front of green leafy palm tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/024a937b64c3b726.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.501, 0.327) (B) (0.839, 0.397) (C) (0.854, 0.472) (D) (0.316, 0.709)" }, { "from": "gpt", "value": "(D) (0.316, 0.709)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f505131fdd2468f0.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) green leafy tree at center (B) brown dry grass at center" }, { "from": "gpt", "value": "(B) brown dry grass at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/502dda0bda3395dc.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue water at center have a smaller size compared to dark gray stone tower at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16e4fe99c6386605.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) gray textured suit at center (B) gray textured tie at center" }, { "from": "gpt", "value": "(A) gray textured suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3ecb99c7e4553777.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.380, 0.619) (B) (0.379, 0.386) (C) (0.457, 0.744)" }, { "from": "gpt", "value": "(B) (0.379, 0.386)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e9b5c64ae119eeb.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the black matte arm at upper right? Choose among these: (A) gray matte tank top at center (B) black matte phone at right (C) gray cotton t-shirt at center" }, { "from": "gpt", "value": "(B) black matte phone at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/081f2ee59b6f5c28.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the dark brown suit at center among (A) dark brown hair at lower right (B) wooden table at center?" }, { "from": "gpt", "value": "(B) wooden table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/315b3919a6ba71bf.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.956, 0.733) (B) (0.733, 0.556)" }, { "from": "gpt", "value": "(B) (0.733, 0.556)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2579cc8b75fd2488.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte blue building at center have a lesser width compared to shiny silver bicycle at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01c007b3aad894a4.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at center have a smaller size compared to muddy water at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/178b234e8e546adf.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte shirt at center positioned behind silver metallic laptop at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b60fbe14cceb4e3a.jpg", "conversations": [ { "from": "human", "value": "\nDoes light brown leather jacket at upper right appear on the left side of black leather jacket at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, light brown leather jacket at upper right is to the right of black leather jacket at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/96015d042c983a19.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) matte blue shirt at upper left (B) blue plaid shirt at center (C) snowy mountain at upper center (D) matte blue shorts at center" }, { "from": "gpt", "value": "(C) snowy mountain at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/69ab2d1572315f57.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue satin dress at center have a larger size compared to decorated christmas tree at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, blue satin dress at center is not larger than decorated christmas tree at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4fe09d84950daba2.jpg", "conversations": [ { "from": "human", "value": "\nIs white shirt at upper center to the right of satin white dress at upper center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, white shirt at upper center is to the right of satin white dress at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6315bb84268831d8.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at upper right appear over brown wooden balcony at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, green leafy tree at upper right is above brown wooden balcony at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d766be7a0cd0b25b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy bush at right is positioned above brown wooden fence at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, green leafy bush at right is positioned over brown wooden fence at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/19c44255619a2f00.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black dotted dress at left is positioned to the left of white smooth onesie at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, black dotted dress at left is positioned on the left side of white smooth onesie at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4d2cde8355dc60b4.jpg", "conversations": [ { "from": "human", "value": "\nDoes yellow-blue fabric flag at upper left have a larger size compared to smooth wood pole at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/76d9922f45d3ab30.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.433, 0.298) (B) (0.736, 0.447) (C) (0.155, 0.062)" }, { "from": "gpt", "value": "(A) (0.433, 0.298)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ff25902182d5341.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if shiny black car at center is positioned to the right of matte silver van at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, shiny black car at center is not to the right of matte silver van at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1a034e208e960ce.jpg", "conversations": [ { "from": "human", "value": "\nDoes red fabric jacket at left appear over yellow shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, red fabric jacket at left is not above yellow shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/38b0c1806216d1d5.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte gray jacket at center have a lesser width compared to striped wool sweater at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, matte gray jacket at center has a lesser width compared to striped wool sweater at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bfec5f6020853cbd.jpg", "conversations": [ { "from": "human", "value": "\nDoes white fluffy cloud at upper center come in front of white fluffy cloud at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, white fluffy cloud at upper center is further to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05428056f43faf27.jpg", "conversations": [ { "from": "human", "value": "\nIs satin black range rover at center closer to camera compared to black plastic license plate at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/91df3c3af0d16f3c.jpg", "conversations": [ { "from": "human", "value": "\nIs matte red jacket at upper left to the right of transparent plastic glasses at lower center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, matte red jacket at upper left is not on the right side of transparent plastic glasses at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cac653bf56bc7872.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of printed fabric skirt at center more distant than that of paisley-patterned skirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, printed fabric skirt at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea34a870480cb312.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) white matte sedan at center (B) white metallic car at center (C) metallic pole at center" }, { "from": "gpt", "value": "(C) metallic pole at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/334a2a487b42da82.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden barrel at right to the right of wooden barrel at center-right from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, wooden barrel at right is to the right of wooden barrel at center-right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/26e2e034db801aff.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) pink fabric at center (B) matte blue electric guitar at center, is positioned closest to the shiny orange electric guitar at center?" }, { "from": "gpt", "value": "(B) matte blue electric guitar at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d92af2fa6527e49.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) green leafy tree at center (B) green leafy tree at lower right (C) matte yellow wood house at center (D) matte yellow wood cottage at center" }, { "from": "gpt", "value": "(A) green leafy tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92e44b76538b0e54.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the denim jacket at center? (A) orange cotton shirt at center (B) orange jumpsuit at right" }, { "from": "gpt", "value": "(B) orange jumpsuit at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3773c7793adef4e1.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of matte black fireplace at center in reference to white plastic window at upper right? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/94ffd1d42ea01098.jpg", "conversations": [ { "from": "human", "value": "\nIs dried grass at center smaller than camouflage fabric uniform at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, dried grass at center is not smaller than camouflage fabric uniform at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77be56a0157eda56.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) brown tiled roofs at center (B) white matte church at center (C) white smooth building at center, is positioned closest to the white stucco clock tower at center?" }, { "from": "gpt", "value": "(B) white matte church at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/494eca7ab6ba94cc.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) yellow jersey at center (B) green grass at lower center (C) matte purple bandana at center" }, { "from": "gpt", "value": "(B) green grass at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e86241c1e3f1ce84.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth concrete stairs at center below matte gray skirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, smooth concrete stairs at center is below matte gray skirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a77a84583e1105b.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) purple synthetic rope at center (B) camouflage fabric climbing harness at center" }, { "from": "gpt", "value": "(B) camouflage fabric climbing harness at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/43505377aa2a5ce1.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.815, 0.820) (B) (0.128, 0.869) (C) (0.725, 0.648) (D) (0.422, 0.658)" }, { "from": "gpt", "value": "(C) (0.725, 0.648)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/156ed02d4013f8f8.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) brown matte hair at upper center (B) tan straw baseball hat at upper center (C) pearl necklace at center (D) brown mesh cap at upper center" }, { "from": "gpt", "value": "(D) brown mesh cap at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/68534aa9bcea4ecc.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.496, 0.541) (B) (0.454, 0.656)" }, { "from": "gpt", "value": "(A) (0.496, 0.541)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/45ceea74bd651aa0.jpg", "conversations": [ { "from": "human", "value": "\nWhere is black matte t-shirt at center located in relation to white jersey at center in the image? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e63e735fac74bf6f.jpg", "conversations": [ { "from": "human", "value": "\nDoes black plastic video camera at upper right lie behind black dotted fabric tie at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, black plastic video camera at upper right is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/21934f107aae40f2.jpg", "conversations": [ { "from": "human", "value": "\nDoes foggy reflective water at center appear on the right side of green matte tree at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find foggy reflective water at center to the right of green matte tree at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1056d8ca4ce38863.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) white striped shirt at center (B) brown wooden table at center" }, { "from": "gpt", "value": "(B) brown wooden table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c14904f887a512c5.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at upper right have a smaller size compared to green leafy plant at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/337470050f8ac68e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.497, 0.620) (B) (0.325, 0.386)" }, { "from": "gpt", "value": "(B) (0.325, 0.386)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f570daa58fae78e.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown rough log at center lie behind dark blue shirt at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, brown rough log at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/39a6aa57a45aba1f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.688, 0.634) (B) (0.227, 0.542) (C) (0.712, 0.486)" }, { "from": "gpt", "value": "(A) (0.688, 0.634)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16adc60d0f258348.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the brown sandy dirt at center? Choose from: (A) brown dry bush at left (B) green leafy bush at center (C) black fur dog at center" }, { "from": "gpt", "value": "(B) green leafy bush at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5a2cdbf2b7fc9fb.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark gray shirt at center appear over blue woven tie at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f9b9e67488c2d4c4.jpg", "conversations": [ { "from": "human", "value": "\nIs metallic silver train at center thinner than yellow matte building at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, metallic silver train at center is not thinner than yellow matte building at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4015b2202545e00b.jpg", "conversations": [ { "from": "human", "value": "\nIs bronze statue at center thinner than shiny bronze statue at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, bronze statue at center might be wider than shiny bronze statue at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a486650ef25c9d8f.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) dark blue shirt at center (B) matte silver pole at right" }, { "from": "gpt", "value": "(B) matte silver pole at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/baba609051b0df52.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) white painted wood sign at lower left (B) green leafy tree at upper right (C) white wooden sign at lower left (D) green textured tree at upper left" }, { "from": "gpt", "value": "(B) green leafy tree at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01edc5b654d1c805.jpg", "conversations": [ { "from": "human", "value": "\nDoes black matte machine gun at center appear on the right side of barbed wire at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, black matte machine gun at center is not to the right of barbed wire at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf981b45850eaa42.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.972, 0.784) (B) (0.124, 0.836)" }, { "from": "gpt", "value": "(A) (0.972, 0.784)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4c132d085b696b43.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.245, 0.509) (B) (0.814, 0.727)" }, { "from": "gpt", "value": "(A) (0.245, 0.509)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b0548110d8c1a2e.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the snowy granite mountain range at center among (A) green matte tree at center (B) white fluffy cloud at upper right?" }, { "from": "gpt", "value": "(B) white fluffy cloud at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0427fdf3a86f66b.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black apron at center appear on the left side of metallic silver pen at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte black apron at center is to the left of metallic silver pen at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f31c274ab228e7fb.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black jacket at center is bigger than blue denim jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, matte black jacket at center has a larger size compared to blue denim jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/42330432d56ad741.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black keyboard at center further to the viewer compared to blonde hair at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, matte black keyboard at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/007632be12e165d9.jpg", "conversations": [ { "from": "human", "value": "\nIs red fabric shorts at right below matte red shorts at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, red fabric shorts at right is not positioned below matte red shorts at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4f510c0bc111fb5.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.638, 0.450) (B) (0.398, 0.605) (C) (0.623, 0.762)" }, { "from": "gpt", "value": "(A) (0.638, 0.450)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3fe98436e814c634.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of black textured sweater at left in relation to smooth skin face at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dafdf12d0b2be6b8.jpg", "conversations": [ { "from": "human", "value": "\nDoes checkered wool coat at center have a smaller size compared to dark green suit at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, checkered wool coat at center has a smaller size compared to dark green suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d314ace773db89f8.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) matte brown wooden hut at center (B) green reflective water at center" }, { "from": "gpt", "value": "(B) green reflective water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba7c1b55ca92d084.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black suit at center is bigger than concrete curb at right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, matte black suit at center is not bigger than concrete curb at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e90c4a288e044a7.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) black glass sign at center (B) pink matte trash can at center" }, { "from": "gpt", "value": "(A) black glass sign at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f0ab77e03460728.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.288, 0.216) (B) (0.623, 0.966) (C) (0.776, 0.539)" }, { "from": "gpt", "value": "(A) (0.288, 0.216)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b305c1e6b1e2c46.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black matte jacket at center is positioned to the right of black plastic sunglasses at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, black matte jacket at center is not on the right side of black plastic sunglasses at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4fceae16dfa14002.jpg", "conversations": [ { "from": "human", "value": "\nIs leather wristwatch at lower left bigger than matte black tank top at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, leather wristwatch at lower left might be smaller than matte black tank top at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58991ea6ec00dbec.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green painted metal clock tower at upper center located in relation to matte black clock at center in the image? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a3dbee2a5a56fa99.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.087, 0.825) (B) (0.906, 0.758) (C) (0.350, 0.362)" }, { "from": "gpt", "value": "(A) (0.087, 0.825)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/279449d482dba63e.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.232, 0.361) (B) (0.658, 0.958) (C) (0.691, 0.822) (D) (0.488, 0.514)" }, { "from": "gpt", "value": "(B) (0.658, 0.958)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cebcdb82dc9425b1.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of ripped denim jeans at center less distant than that of green matte bowling ball at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/006b275b83fa5660.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of red fabric shorts at lower right and blue fabric person at lower right in the image provided, where is red fabric shorts at lower right located with respect to blue fabric person at lower right? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/176083328d2ff96b.jpg", "conversations": [ { "from": "human", "value": "\nDoes blonde curly hair at center come in front of white matte bomber jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/716110ddf7c7bba3.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) matte brown tarpaulin boat at center (B) brown tarpaulin boat at center" }, { "from": "gpt", "value": "(A) matte brown tarpaulin boat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/98005e4b0189d5f3.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of glassy silver skyscraper at center in reference to matte glass skyscraper at center-left? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58fcce17c68fa84b.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.465, 0.286) (B) (0.635, 0.409)" }, { "from": "gpt", "value": "(B) (0.635, 0.409)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01a7ece5a0373763.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte cardboard box at center have a greater width compared to black glossy phone at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/695ed9d948e80225.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) silhouette bare tree at lower center (B) white fluffy cloud at upper center (C) silhouette bare tree at center (D) white powdery snow at lower center" }, { "from": "gpt", "value": "(D) white powdery snow at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7683fc6c99e5be87.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.344, 0.842) (B) (0.793, 0.153) (C) (0.347, 0.602) (D) (0.421, 0.000)" }, { "from": "gpt", "value": "(D) (0.421, 0.000)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/093a78334ed753d0.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.584, 0.609) (B) (0.291, 0.891) (C) (0.805, 0.828)" }, { "from": "gpt", "value": "(A) (0.584, 0.609)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/51fe9387ef7d1268.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) white wood gazebo at center (B) green grass at lower center" }, { "from": "gpt", "value": "(A) white wood gazebo at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03e7457d6a6ae9ce.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white plastic desktop computer at center is thinner than green glossy leaf at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white plastic desktop computer at center's width is not less than green glossy leaf at upper right's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be6b4dfb3302b0e6.jpg", "conversations": [ { "from": "human", "value": "\nWhere is black metal pole at upper left located in relation to silver metallic pole at center in the image? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/059f048ec642750f.jpg", "conversations": [ { "from": "human", "value": "\nDoes satin silver sedan at center appear under shiny chrome motorcycle at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, satin silver sedan at center is located below shiny chrome motorcycle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a7268fe58ca9d22.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) white matte shirt at center (B) dark brown hair at lower right (C) red plaid shirt at lower right" }, { "from": "gpt", "value": "(A) white matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73150a0b7f88d432.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.135, 0.975) (B) (0.541, 0.694) (C) (0.254, 0.369)" }, { "from": "gpt", "value": "(B) (0.541, 0.694)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/69cbaabd3161b5f1.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) gray stone dog at left (B) green rubber frog at center (C) green leafy tree at center (D) shiny black stone dog at center" }, { "from": "gpt", "value": "(C) green leafy tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e5110379d40a8c1b.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) metallic yellow train at center (B) white matte figure at center" }, { "from": "gpt", "value": "(B) white matte figure at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/051a2f8eaf998615.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) khaki pants at lower center (B) matte black camera at center" }, { "from": "gpt", "value": "(A) khaki pants at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/96936492bb9dbf73.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) gray pebbled beach at center (B) gray weathered wood log at lower left" }, { "from": "gpt", "value": "(A) gray pebbled beach at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a86ae1385fe7622.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the brown stone pillar at center? Select from: (A) woven brown chair at center (B) clear glass table at center (C) beige stone pillar at center (D) beige concrete pillar at center" }, { "from": "gpt", "value": "(A) woven brown chair at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e985711fc67e27f.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the matte red shirt at center? Select from: (A) blue leather jacket at center (B) red fabric shirt at center" }, { "from": "gpt", "value": "(A) blue leather jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01777ac68a7f3c5c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.930, 0.611) (B) (0.842, 0.420)" }, { "from": "gpt", "value": "(B) (0.842, 0.420)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/39007b4d79503966.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) silver metallic pillar at center (B) transparent plastic city model at center" }, { "from": "gpt", "value": "(B) transparent plastic city model at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e406b4d6abf0ebb5.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy trees at center further to camera compared to green leafy tree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f04cf5cf88263ce.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue plaid shirt at center appear over matte black monitor at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a97273ff44c740bb.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of green cotton shirt at center more distant than that of matte brown cardboard box at right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, green cotton shirt at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/537c4080ba6e5374.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) blue plush bird at center (B) green cotton shirt at right (C) striped cotton dress at center" }, { "from": "gpt", "value": "(A) blue plush bird at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5308043503d00c1e.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.716, 0.625) (B) (0.296, 0.648)" }, { "from": "gpt", "value": "(A) (0.716, 0.625)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/874fe56adfbf0721.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) matte plastic hand at center (B) white rubber bracelet at lower right" }, { "from": "gpt", "value": "(A) matte plastic hand at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/13f157037d59b59c.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the black plastic laptop at lower left from the following options: (A) black matte scarf at upper center (B) silver metallic laptop at center-right (C) black fabric braids at upper right (D) black matte scarf at upper left?" }, { "from": "gpt", "value": "(D) black matte scarf at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/587b524f8c1ca7ca.jpg", "conversations": [ { "from": "human", "value": "\nIs camouflage uniform at center to the right of dark blue wool coat at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, camouflage uniform at center is positioned on the right side of dark blue wool coat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be39c97911aca16e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white frosted glass at upper center is thinner than clear glass window at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, white frosted glass at upper center might be wider than clear glass window at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f55df5d2b52c2e10.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte orange jumpsuit at center is wider than matte red shirt at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, matte orange jumpsuit at center is not wider than matte red shirt at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03e2d3336c54aa45.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue glossy book at center appear on the right side of shiny metallic table at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, blue glossy book at center is not on the right side of shiny metallic table at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a96d59379721f0fb.jpg", "conversations": [ { "from": "human", "value": "\nWhere is blue water at center located in relation to white textured shirt at right in the image? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ecde74080a088e5.jpg", "conversations": [ { "from": "human", "value": "\nDoes pink checkered shirt at center come in front of shiny skin boy at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, pink checkered shirt at center is in front of shiny skin boy at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5feb8f8a9a94a31d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte gray guitar at left is bigger than dark blue patterned shirt at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, matte gray guitar at left is larger in size than dark blue patterned shirt at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/184d64eb37437b41.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if orange cotton t-shirt at center is positioned below black lace top at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, orange cotton t-shirt at center is below black lace top at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d38e62dbf075dbf.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.876, 0.741) (B) (0.124, 0.152)" }, { "from": "gpt", "value": "(B) (0.124, 0.152)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e997952dc4469c0.jpg", "conversations": [ { "from": "human", "value": "\nIs teal floral blouse at center smaller than clear glass wine glass at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, teal floral blouse at center is not smaller in size than clear glass wine glass at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c1cf4c19ab851063.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.194, 0.534) (B) (0.778, 0.683)" }, { "from": "gpt", "value": "(B) (0.778, 0.683)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c8b4d3ff3053372d.jpg", "conversations": [ { "from": "human", "value": "\nIs green smooth water at center below smooth red bridge at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green smooth water at center is positioned under smooth red bridge at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/308d5391561db46c.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of white matte shirt at left in reference to dark blue t-shirt at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df1a4f3ca591a83a.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) green leafy tree at center (B) white glossy train at center (C) green leafy tree at right" }, { "from": "gpt", "value": "(C) green leafy tree at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b6c08ffdc28f9a9.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of black glossy eye at upper left in reference to black glossy eye at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70d3ef1812cdf724.jpg", "conversations": [ { "from": "human", "value": "\nDoes speckled brown fish at center appear on the right side of translucent blue segmented worm at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, speckled brown fish at center is to the left of translucent blue segmented worm at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0778a9d15ffd514.jpg", "conversations": [ { "from": "human", "value": "\nIs green glass traffic light at left smaller than white plastic license plate at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, green glass traffic light at left is not smaller in size than white plastic license plate at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5e9e0e266586db5.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.634, 0.233) (B) (0.873, 0.347)" }, { "from": "gpt", "value": "(A) (0.634, 0.233)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01d5a328230cd142.jpg", "conversations": [ { "from": "human", "value": "\nWhere is black swim trunks at center located in relation to tan skin man at center in the image? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2a697522faf3cb07.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the green mossy rock at lower right? (A) gray mossy rock at lower right (B) smooth gray rock at lower right" }, { "from": "gpt", "value": "(A) gray mossy rock at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/689476f9521847c7.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass at center below wooden sculpture at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, green grass at center is not below wooden sculpture at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05799a0849d9c63d.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at center have a greater width compared to green leafy tree at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, green leafy tree at center is wider than green leafy tree at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/10b0a4869bbd2845.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) smooth reflective water at center (B) golden-brown foliage at center" }, { "from": "gpt", "value": "(A) smooth reflective water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b41aade2b20cbe0.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white marble stairs at lower center is positioned to the right of white marble stairs at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white marble stairs at lower center is not to the right of white marble stairs at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/863c18d6e904a4d4.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte plastic atm at center is thinner than white matte skirt at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, matte plastic atm at center might be wider than white matte skirt at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c1e31c26a651624.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.909, 0.781) (B) (0.515, 0.272) (C) (0.429, 0.559) (D) (0.195, 0.181)" }, { "from": "gpt", "value": "(D) (0.195, 0.181)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9562af115156a847.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if khaki cotton pants at right is positioned to the right of black plastic sunglasses at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, khaki cotton pants at right is to the right of black plastic sunglasses at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/14b4d8e2975d4112.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.458, 0.866) (B) (0.500, 0.589)" }, { "from": "gpt", "value": "(A) (0.458, 0.866)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/42b33a63d2ff4057.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown leather bag at center come in front of metallic gray chair at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/daebc735b1f025bc.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white shirt at center is positioned below pink fabric at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ecf0b3f70ce98c83.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) matte white cup at upper left (B) white glossy cup at upper center" }, { "from": "gpt", "value": "(B) white glossy cup at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/019e27e71c7c4877.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the white matte cup at center? Choose among these: (A) porcelain plate with food remnants at center (B) clear plastic cup at lower center" }, { "from": "gpt", "value": "(B) clear plastic cup at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/329c2cf0063e4326.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.263, 0.389) (B) (0.331, 0.536) (C) (0.123, 0.444)" }, { "from": "gpt", "value": "(B) (0.331, 0.536)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78c1989056c344d3.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the green grass at lower center? Choose from: (A) yellow fabric parachute at upper center (B) snowy white mountain range at upper center" }, { "from": "gpt", "value": "(A) yellow fabric parachute at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7d6cd3655be0c1d2.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if wooden table at center is thinner than yellow matte hand at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, wooden table at center's width is not less than yellow matte hand at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/30735642c545e845.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if light blue fabric shirt at center is positioned to the right of yellow fabric shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, light blue fabric shirt at center is to the left of yellow fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/beb5b74fc8641b02.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.962, 0.269) (B) (0.448, 0.225) (C) (0.669, 0.675)" }, { "from": "gpt", "value": "(A) (0.962, 0.269)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c032548035d9684f.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark brown suit at center appear over patterned silk tie at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, dark brown suit at center is above patterned silk tie at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07c44f3b7f0c93a0.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) white plastic monitor at center (B) white plastic keyboard at lower center" }, { "from": "gpt", "value": "(B) white plastic keyboard at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e6f1ad8d0499401c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) bronze statue at center (B) rustic stone at center" }, { "from": "gpt", "value": "(A) bronze statue at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c05c164a4e4301e7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dry grass at center is positioned below green textured tree at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08a69dd00d346553.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy bush at center right bigger than green leafy hedge at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, green leafy bush at center right has a larger size compared to green leafy hedge at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c99e173111bc2ffd.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) brown leather sandals at lower center (B) shiny gold bracelet at lower center (C) matte black dress at lower left" }, { "from": "gpt", "value": "(C) matte black dress at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6dbf69d5dee5e24b.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow matte train at center smaller than red plastic stop sign at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4d5c7ee633209b7c.jpg", "conversations": [ { "from": "human", "value": "\nDoes transparent glass car window at left have a larger size compared to matte black jacket at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, transparent glass car window at left is larger in size than matte black jacket at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/122709f502104dc8.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of green leafy hedge at lower right and green leafy hedge at lower left in the image provided, where is green leafy hedge at lower right located with respect to green leafy hedge at lower left? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2647a6ab01ccbd61.jpg", "conversations": [ { "from": "human", "value": "\nIs matte plastic bag of dried fruits at center to the right of blue apron at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, matte plastic bag of dried fruits at center is to the right of blue apron at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04723acc84beb463.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if maroon sweater at center is bigger than light gray shirt at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, maroon sweater at center has a larger size compared to light gray shirt at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/024113a6916f0fe0.jpg", "conversations": [ { "from": "human", "value": "\nIs brown cardboard box at upper left smaller than white glossy table at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, brown cardboard box at upper left occupies less space than white glossy table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a41ccce385c14780.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is metallic pole at center located relative to white paper sign at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8afc257ac9a3192.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the gray matte penguin at center? Choose from: (A) smooth gray penguin at center (B) black glossy penguin at center" }, { "from": "gpt", "value": "(A) smooth gray penguin at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73e6e65f12fe0371.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray concrete building at center is positioned to the right of dark gray stone clock at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, gray concrete building at center is not on the right side of dark gray stone clock at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df9fe5c48cdf96a6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if metallic red number at center is positioned above smooth stone spire at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, metallic red number at center is not positioned above smooth stone spire at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88f0e6618e7f8ba8.jpg", "conversations": [ { "from": "human", "value": "\nIs rusty metal truck at center to the left of green leafy tree at right from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, rusty metal truck at center is to the left of green leafy tree at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1cce1f42384ad12e.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth brown tree trunk at center thinner than green painted wood sign at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/687dad30424f578d.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.298, 0.316) (B) (0.765, 0.058)" }, { "from": "gpt", "value": "(A) (0.298, 0.316)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f9943660aea98fa.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) light gray suit at center (B) black matte laptop at right" }, { "from": "gpt", "value": "(B) black matte laptop at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b97f56c6a19204bf.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) metallic aviator sunglasses at center (B) red fabric jacket at center" }, { "from": "gpt", "value": "(A) metallic aviator sunglasses at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/99b721b9627b22ec.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if metallic green and white race car at left is thinner than metallic blue race car at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02693776749e9108.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if smooth asphalt tarmac at center is bigger than shiny metallic airplane at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, smooth asphalt tarmac at center is larger in size than shiny metallic airplane at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f12b60861ccd03af.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) blue water at center (B) green leafy bush at left" }, { "from": "gpt", "value": "(A) blue water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0b689310363a4e7.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) light pink fabric dress at center (B) polka dot fabric dress at center (C) golden fur dog at lower left (D) white fluffy pony at right" }, { "from": "gpt", "value": "(C) golden fur dog at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8951b6d9127def99.jpg", "conversations": [ { "from": "human", "value": "\nIs white plastic dock at right positioned before shiny white sailboat at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, white plastic dock at right is in front of shiny white sailboat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e5110df26a0ad9f8.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) rainbow striped hot air balloon at center (B) multicolored striped hot air balloon at center" }, { "from": "gpt", "value": "(B) multicolored striped hot air balloon at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dcb578236a6d9ceb.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.826, 0.370) (B) (0.542, 0.756)" }, { "from": "gpt", "value": "(A) (0.826, 0.370)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c43d67c87fda686e.jpg", "conversations": [ { "from": "human", "value": "\nDoes white fabric at center appear on the left side of floral-patterned blouse at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find white fabric at center to the left of floral-patterned blouse at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/623fa1dfa00a6ab7.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) matte beige blouse at center (B) gray textured skirt at right (C) dark gray textured dress at center (D) smooth asphalt pavement at center" }, { "from": "gpt", "value": "(D) smooth asphalt pavement at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5cc4d893b346fd5c.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark stone stairs at center appear on the right side of black stone pillar at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, dark stone stairs at center is not on the right side of black stone pillar at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7f9820ab7e35e98e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if maroon woolen robe at center is positioned below striped fabric shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, maroon woolen robe at center is above striped fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/576cbf968b2ee556.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if camouflage uniform at left is bigger than camouflage fabric at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44acecfe82a35aa7.jpg", "conversations": [ { "from": "human", "value": "\nIs orange glossy car at center bigger than white teeth plastic mouth at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, orange glossy car at center has a larger size compared to white teeth plastic mouth at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5263c8f3d3542ae8.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of matte gray t-shirt at center in relation to gray cotton t-shirt at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/20556607c7277159.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of white woven hat at upper center and clear water at creek center in the image provided, where is white woven hat at upper center located with respect to clear water at creek center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3f9ba6010cf96be3.jpg", "conversations": [ { "from": "human", "value": "\nDoes green grassy at center have a larger size compared to stone cross at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, green grassy at center is not bigger than stone cross at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aa03cb7c913fe083.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte can at center further to camera compared to green ribbed sweater at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b06f952f794a398.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) gray matte pigeon at center (B) speckled gray pigeon at center (C) matte gray pigeon at left (D) purple iridescent pigeon at center" }, { "from": "gpt", "value": "(C) matte gray pigeon at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7d7954bbacc5acb4.jpg", "conversations": [ { "from": "human", "value": "\nIs matte white sweater at left to the right of black matte microphone at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, matte white sweater at left is to the left of black matte microphone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c92e06c9f14cacbf.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green camouflage netting at center located in relation to brown wire mesh fence at lower center in the image? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c643dd6a930127f1.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) black metallic microphone at upper left (B) floral-patterned fabric dress at center (C) pink matte sweater at center" }, { "from": "gpt", "value": "(A) black metallic microphone at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b08cf3a90f1ab14.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the black matte shirt at lower right among (A) pink textured sweater at center (B) silver metallic laptop at lower center (C) beige suede jacket at center?" }, { "from": "gpt", "value": "(B) silver metallic laptop at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca81a098edfabc2f.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white matte van at lower left is smaller than metallic pink tower at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, white matte van at lower left has a smaller size compared to metallic pink tower at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a0044ffb51fdea4.jpg", "conversations": [ { "from": "human", "value": "\nIs dark gray suit at left bigger than dark gray fabric dress at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/13012f02f74f9e14.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte helmet at center appear on the left side of black matte helmet at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white matte helmet at center is not on the left side of black matte helmet at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d9fcb195834afe2.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) shiny black suit at upper right (B) white shirt at left (C) matte gray suit at center (D) dark gray suit at center" }, { "from": "gpt", "value": "(A) shiny black suit at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7838357927958405.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if red argyle sweater vest at center is positioned to the right of black denim skirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, red argyle sweater vest at center is positioned on the right side of black denim skirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/925039f929325894.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green textured tree at center is positioned to the left of green grass at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, green textured tree at center is to the right of green grass at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4463616e48da8f0b.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of brown tweed pants at center more distant than that of leather jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is in front of leather jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e2b5e3a3c350d6a.jpg", "conversations": [ { "from": "human", "value": "\nIs green fabric shirt at center above pink fabric at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ba8904b5037348e.jpg", "conversations": [ { "from": "human", "value": "\nIs leather jacket at center wider than striped woolen hat at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, leather jacket at center's width does not surpass striped woolen hat at upper center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/347d02c2d28e09b7.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) gray striped shirt at right (B) floral fabric dress at lower left (C) black plastic microphone at upper right (D) matte blue scarf at center" }, { "from": "gpt", "value": "(D) matte blue scarf at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6f01bc858406b08.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) white fabric shorts at lower right (B) white fabric shoe at lower right (C) gray concrete pavement at lower left" }, { "from": "gpt", "value": "(C) gray concrete pavement at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec1ab69647c1b8cc.jpg", "conversations": [ { "from": "human", "value": "\nIs brown leather jacket at center positioned at the back of matte blue jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, brown leather jacket at center is behind matte blue jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/28f345bee8e8c1b2.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at center is bigger than metallic silver chair at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, green leafy tree at center might be smaller than metallic silver chair at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd4b113f317c3e13.jpg", "conversations": [ { "from": "human", "value": "\nDoes black chalkboard at center have a larger size compared to matte gray backpack at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f5541df60e159e5.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) brown matte paella at center (B) shiny metal wok at center (C) black cotton shirt at right" }, { "from": "gpt", "value": "(C) black cotton shirt at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0f39eb0de183ba0.jpg", "conversations": [ { "from": "human", "value": "\nWhere is yellow matte shirt at center located in relation to light beige shirt at center in the image? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/724f6855b0e38b18.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) black metallic microphone at upper center (B) wooden drum at center (C) green wood drum at left" }, { "from": "gpt", "value": "(C) green wood drum at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b0e40f9e872c656.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.525, 0.473) (B) (0.403, 0.103) (C) (0.787, 0.869)" }, { "from": "gpt", "value": "(C) (0.787, 0.869)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05f6a942eebc69de.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the shiny red firetruck at center? Choose from: (A) metallic silver door at center (B) shiny red fire truck at left" }, { "from": "gpt", "value": "(B) shiny red fire truck at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04e8c040cbfb2e09.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte coat at center below fluffy beige dog at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, black matte coat at center is above fluffy beige dog at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce9b604cb68a2a7b.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of green leafy tree at upper center in relation to white paper sign at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e71fdc48005bcacb.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.970, 0.092) (B) (0.215, 0.963)" }, { "from": "gpt", "value": "(A) (0.970, 0.092)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a217b690e1698744.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of orange fabric shirt at center more distant than that of matte green helmet at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, orange fabric shirt at center is further from the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1ed2ebdfc6f15de.jpg", "conversations": [ { "from": "human", "value": "\nDoes smooth skin man at center appear on the right side of smooth skin child at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, smooth skin man at center is not to the right of smooth skin child at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cbc401a457008168.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black rubber tire at upper left is positioned to the left of matte pink backpack at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, black rubber tire at upper left is not on the left side of matte pink backpack at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86cb4a574a4c4ba9.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.343, 0.128) (B) (0.712, 0.400)" }, { "from": "gpt", "value": "(A) (0.343, 0.128)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0603d11911a109f0.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.820, 0.528) (B) (0.858, 0.595) (C) (0.114, 0.602)" }, { "from": "gpt", "value": "(A) (0.820, 0.528)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/63755cb7b10ecdd7.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.335, 0.691) (B) (0.996, 0.342)" }, { "from": "gpt", "value": "(B) (0.996, 0.342)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/31cd121419551298.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the matte gray building at right? Choose among these: (A) silver metallic bicycle at lower center (B) silver metallic bicycle at lower right" }, { "from": "gpt", "value": "(A) silver metallic bicycle at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f00963f294be0ce.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.582, 0.212) (B) (0.881, 0.812) (C) (0.418, 0.497) (D) (0.264, 0.123)" }, { "from": "gpt", "value": "(A) (0.582, 0.212)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/788e886114b50f9c.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) brown stone spire at lower left (B) dark gray stone spire at center" }, { "from": "gpt", "value": "(A) brown stone spire at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/539cdaa2ed526f8d.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.566, 0.291) (B) (0.562, 0.675)" }, { "from": "gpt", "value": "(B) (0.562, 0.675)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/913144e148ec110c.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.922, 0.720) (B) (0.739, 0.736) (C) (0.807, 0.744)" }, { "from": "gpt", "value": "(B) (0.739, 0.736)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/020896c3b64cc356.jpg", "conversations": [ { "from": "human", "value": "\nDoes red matte shirt at lower left lie in front of green matte bicycle at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7036f0e312acf291.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) light brown skin at upper left (B) green plastic sippy cup at lower right (C) matte black shirt at upper left (D) pink fleece jacket at left" }, { "from": "gpt", "value": "(B) green plastic sippy cup at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e89dc161d744a13.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the stone castle at center? Choose among these: (A) green rough bark tree at center (B) green leafy tree at left (C) green leafy tree at center" }, { "from": "gpt", "value": "(C) green leafy tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7b995bbbb45dc6d.jpg", "conversations": [ { "from": "human", "value": "\nDoes black matte shirt at center appear over striped cotton shirt at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, black matte shirt at center is not positioned above striped cotton shirt at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3aab67fd704158c2.jpg", "conversations": [ { "from": "human", "value": "\nDoes white cotton shirt at center have a smaller size compared to white cotton shirt at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white cotton shirt at center is not smaller than white cotton shirt at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08d6eb11b9eaa104.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if light brown sandy beach at lower right is bigger than clear water at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, light brown sandy beach at lower right is not bigger than clear water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/054e9c6d4c9e3b39.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the pink fabric at lower left? (A) knitted sweater at center (B) beige knitted sweater at upper right (C) wooden at lower center (D) green grass at lower center" }, { "from": "gpt", "value": "(B) beige knitted sweater at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05ce19039bafe398.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny brown hardwood floor at center below silver metallic radiator at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, shiny brown hardwood floor at center is positioned under silver metallic radiator at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf476079a44288b9.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.779, 0.572) (B) (0.429, 0.894)" }, { "from": "gpt", "value": "(A) (0.779, 0.572)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0adca529cab8ad1e.jpg", "conversations": [ { "from": "human", "value": "\nIs clear glass window at center behind dark brown textured couch at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4af31490b5c2c644.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.812, 0.439) (B) (0.492, 0.520)" }, { "from": "gpt", "value": "(A) (0.812, 0.439)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fd2d9c48e2bab95d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.370, 0.722) (B) (0.781, 0.923)" }, { "from": "gpt", "value": "(B) (0.781, 0.923)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c1b98635d8cb53f0.jpg", "conversations": [ { "from": "human", "value": "\nIs light brown wooden bench at lower center bigger than shiny red car at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a76f7fd82fe96fbe.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown matte duck at upper right is smaller than white matte duckling at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf1ebd3a1b8ebf97.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray cotton t-shirt at left have a lesser width compared to matte white shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, gray cotton t-shirt at left's width is not less than matte white shirt at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36156cc534d9646a.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the blurred people at upper center among (A) brown leather horse at center (B) leather armor at center (C) multicolored fabric at upper right?" }, { "from": "gpt", "value": "(B) leather armor at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a482f2b58b06d5b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black stone sign at center is smaller than satin silver car at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, black stone sign at center occupies less space than satin silver car at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed4c589ad69cce94.jpg", "conversations": [ { "from": "human", "value": "\nDoes green grassy at lower center have a lesser width compared to clear wire at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, green grassy at lower center's width is less than clear wire at upper center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5806f965a2db3205.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at center appear on the left side of green matte tree at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, green leafy tree at center is positioned on the left side of green matte tree at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/76b36f7d3436dca4.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue tarp-covered couch at lower right appear under shiny black bike at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd097433c5070e13.jpg", "conversations": [ { "from": "human", "value": "\nDoes white silk vestment at center appear on the right side of black cloth at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, white silk vestment at center is to the right of black cloth at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c8e35cf7e95972c.jpg", "conversations": [ { "from": "human", "value": "\nDoes shiny purple bottle at center have a greater width compared to matte gold foil wine bottle at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6801f9bc6b69c4b7.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass at center positioned before black glossy pig at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is in front of black glossy pig at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec153a42cdc4a5e1.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the pink satin tie at center? Choose from: (A) smooth black hair at center (B) black suit at right (C) matte black suit at center" }, { "from": "gpt", "value": "(B) black suit at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8456cacb25ac3f7f.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the gray asphalt highway at center? Select from: (A) metallic silver trailer truck at center (B) american flag painted truck at right" }, { "from": "gpt", "value": "(A) metallic silver trailer truck at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/18c76cd6b5cd09b4.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the denim/jeans at lower left among (A) green matte shirt at upper center (B) brown stone stairs at center?" }, { "from": "gpt", "value": "(B) brown stone stairs at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc321cdceab9c4aa.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth water at lower center above black plastic smartphone at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49b853c565075e57.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden cutting board at center thinner than raw marbled meat at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, wooden cutting board at center is not thinner than raw marbled meat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f071fb7f4bee794.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the rusty rock at right? Select from: (A) smooth gray fish at upper left (B) silvery textured fish at lower center" }, { "from": "gpt", "value": "(B) silvery textured fish at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/17e79f69b775083c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.806, 0.958) (B) (0.294, 0.456) (C) (0.364, 0.136)" }, { "from": "gpt", "value": "(C) (0.364, 0.136)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf683e881947e474.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) white cotton shirt at upper center (B) orange striped fabric at center (C) orange striped fabric at lower center" }, { "from": "gpt", "value": "(B) orange striped fabric at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4926d58bd02ef461.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white matte airplane at center is wider than white glossy airplane at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2a90b721e93b0cfc.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if translucent glass table at center is bigger than translucent glass beer glass at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, translucent glass table at center has a larger size compared to translucent glass beer glass at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b065432e50194c1.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown frothy water at center have a greater width compared to brown textured water at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, brown frothy water at center has a greater width compared to brown textured water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb4f6d0f34cbad66.jpg", "conversations": [ { "from": "human", "value": "\nDoes black matte hair at center appear on the right side of blue striped shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find black matte hair at center to the right of blue striped shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d04812cd179d42f.jpg", "conversations": [ { "from": "human", "value": "\nDoes black fabric pants at lower left have a greater width compared to light purple fabric at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, black fabric pants at lower left has a greater width compared to light purple fabric at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f206b641a1d65dc4.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if transparent glass car window at upper left is wider than purple fabric cap at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, transparent glass car window at upper left's width does not surpass purple fabric cap at lower center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/42d2bdbb4295d6c0.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) blue cardboard box at center (B) white mesh hat at upper right" }, { "from": "gpt", "value": "(B) white mesh hat at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f80ca2781911da6c.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte red wooden house at right have a greater width compared to satin silver car at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6a30050318ae936d.jpg", "conversations": [ { "from": "human", "value": "\nIs reflective glass water at lower center below wooden boat at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, reflective glass water at lower center is not below wooden boat at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cde5c1cc6923b1d5.jpg", "conversations": [ { "from": "human", "value": "\nIs gray matte mountain at center bigger than white glossy ferry at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a101eb52285ad33.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of brown grass at center in reference to brown glossy horse at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/31d90c78188a1ae3.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) white matte blazer at center (B) gold-framed picture at lower left" }, { "from": "gpt", "value": "(A) white matte blazer at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5369e7a6222f494f.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) velvet red coat at center (B) dark gray suit at right (C) blue and white fabric flag at upper right" }, { "from": "gpt", "value": "(B) dark gray suit at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/71f33fb571717d6f.jpg", "conversations": [ { "from": "human", "value": "\nDoes wooden shelves at upper left have a greater width compared to wooden shelf at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, wooden shelves at upper left is wider than wooden shelf at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7bc2ca7089fdc4a4.jpg", "conversations": [ { "from": "human", "value": "\nIs blonde hair at lower left below light blue uniform at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, blonde hair at lower left is not positioned below light blue uniform at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/539a80e6becf1ef7.jpg", "conversations": [ { "from": "human", "value": "\nIs orange striped fabric at right wider than white matte microwave at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fa97f0d965f7cd0e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.360, 0.867) (B) (0.767, 0.447)" }, { "from": "gpt", "value": "(A) (0.360, 0.867)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/787a7dd407d4ebdc.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) black satin dress at left (B) green striped shirt at center (C) striped cotton shirt at center (D) cracked concrete path at center" }, { "from": "gpt", "value": "(D) cracked concrete path at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00d7e2f5886a9926.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) striped sweater at center (B) blue plaid shirt at upper center (C) black suit jacket at center (D) floral-patterned dress at upper left" }, { "from": "gpt", "value": "(B) blue plaid shirt at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/93a12c85e08c69d2.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) red cotton shirt at lower center (B) yellow fabric shirt at lower left" }, { "from": "gpt", "value": "(A) red cotton shirt at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fec6653770e8dac7.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.189, 0.400) (B) (0.877, 0.434)" }, { "from": "gpt", "value": "(A) (0.189, 0.400)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1b4be76291eda31.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of green uniform students at center and green fabric shirt at center in the image provided, where is green uniform students at center located with respect to green fabric shirt at center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f4d50f79fb497e3.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte blue hijab at center appear under pink sheer hijab at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, matte blue hijab at center is not positioned below pink sheer hijab at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8fa7b25a81638df4.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the matte black suit at left? (A) clear glass wine glass at center (B) clear glass champagne at center (C) matte red sweater at lower right" }, { "from": "gpt", "value": "(C) matte red sweater at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86c4cb1f4b05b579.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if clear plastic bottle at center is positioned above black wood table at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e9d4bb7ca746aa77.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte glass window at upper left appear on the left side of transparent glass door at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte glass window at upper left is to the left of transparent glass door at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f3ac11ee5fdb61e4.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) gray rough rock at center (B) silhouette figure at center (C) smooth gray rock at right (D) blue cotton shirt at right" }, { "from": "gpt", "value": "(C) smooth gray rock at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2a596c866f68ae26.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) white grid-patterned building at lower left (B) white glass building at upper left (C) dark blue glass building at lower right (D) transparent glass building at upper right" }, { "from": "gpt", "value": "(B) white glass building at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d826af3b5b58e08d.jpg", "conversations": [ { "from": "human", "value": "\nIs metallic blue car at lower left positioned behind matte silver car at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f2d490dec33cadc3.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) brown wool coat at right (B) dark brown leather coat at center" }, { "from": "gpt", "value": "(A) brown wool coat at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd55cf49c26e7c9e.jpg", "conversations": [ { "from": "human", "value": "\nDoes black matte business suit at center appear under black matte business suit at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, black matte business suit at center is positioned under black matte business suit at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/50bae7187e325673.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the red fabric shorts at center? Choose from: (A) white cotton t-shirt at upper right (B) light blue shirt at center" }, { "from": "gpt", "value": "(B) light blue shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce1a7cfff2860d50.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) black matte pants at center (B) denim jacket at left (C) dark brown leather jacket at center (D) dark blue leather jacket at center" }, { "from": "gpt", "value": "(C) dark brown leather jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e55921cd36a71b7b.jpg", "conversations": [ { "from": "human", "value": "\nDoes green textured sweater at center come behind white textured shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, green textured sweater at center is in front of white textured shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce3c03073b3db3ac.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) dark gray jacket at center (B) white fabric bag at center" }, { "from": "gpt", "value": "(A) dark gray jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e72cfc6967983521.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.803, 0.336) (B) (0.229, 0.533) (C) (0.406, 0.473) (D) (0.166, 0.472)" }, { "from": "gpt", "value": "(B) (0.229, 0.533)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/489045df101e9257.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if stone ruins at upper right is positioned above white glossy boat at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, stone ruins at upper right is located above white glossy boat at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06e75a62e93aa0f6.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the black denim shorts at right from the following options: (A) floral print dress at center (B) printed cotton dress at center?" }, { "from": "gpt", "value": "(B) printed cotton dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fee108207d575e5b.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte white tote bag at left appear on the right side of matte red jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, matte white tote bag at left is not on the right side of matte red jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b37b1a3238dfc89.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black monitor at center is smaller than matte black camera at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, matte black monitor at center is not smaller than matte black camera at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b20f99ef66cdae5.jpg", "conversations": [ { "from": "human", "value": "\nDoes silver metallic car at center have a smaller size compared to matte black sedan at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, silver metallic car at center has a smaller size compared to matte black sedan at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff8110e5ed5df34a.jpg", "conversations": [ { "from": "human", "value": "\nIs transparent glass window at center thinner than wooden table at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, transparent glass window at center is not thinner than wooden table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cb45e8207d8af8dc.jpg", "conversations": [ { "from": "human", "value": "\nDoes snowy granite mountain range at upper center come in front of black woolly sheep at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e10f552d0b16009f.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass at center thinner than shiny red electric guitar at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9fd6456e883709bd.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) wooden table at right (B) brown wooden table at center" }, { "from": "gpt", "value": "(B) brown wooden table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e36f141d6221b9de.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) matte pink blouse at center (B) gold ornate railing at lower right" }, { "from": "gpt", "value": "(B) gold ornate railing at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4ffbe1d3a7d7501c.jpg", "conversations": [ { "from": "human", "value": "\nIs brown sandy dirt at center to the left of matte black riding jacket at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, brown sandy dirt at center is not to the left of matte black riding jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/017952040bcbd780.jpg", "conversations": [ { "from": "human", "value": "\nIs gray metallic train track at center bigger than dark gray fabric uniform at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, gray metallic train track at center has a larger size compared to dark gray fabric uniform at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/724f4223518882ec.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) stone arches at center (B) green leafy tree at left (C) green leafy tree at center (D) green textured tree at center" }, { "from": "gpt", "value": "(B) green leafy tree at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d178c2061d4b252d.jpg", "conversations": [ { "from": "human", "value": "\nIs white cotton shirt at center closer to camera compared to smooth rock at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e67c7f9be7b03a6e.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of white tulle dress at lower center and vibrant floral bouquet at center in the image provided, where is white tulle dress at lower center located with respect to vibrant floral bouquet at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/303625b71992ead6.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the white frothy wave at lower center? (A) green rubber surfboard at center (B) white foam surfboard at center" }, { "from": "gpt", "value": "(A) green rubber surfboard at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f65b5ee3ba53243c.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue matte van at center have a greater width compared to matte black jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, blue matte van at center has a greater width compared to matte black jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/225b16cf882df056.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.359, 0.569) (B) (0.486, 0.633) (C) (0.682, 0.455) (D) (0.057, 0.439)" }, { "from": "gpt", "value": "(D) (0.057, 0.439)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d86e45e4bc6cb7b.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) matte red kayak at center (B) smooth water at center (C) green leafy tree at center" }, { "from": "gpt", "value": "(A) matte red kayak at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a0128e98de19614d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown sandy beach at lower center is positioned to the left of silhouette hat at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, brown sandy beach at lower center is to the right of silhouette hat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44a7eaa12918b33c.jpg", "conversations": [ { "from": "human", "value": "\nIs brown grassy shrubs at center further to the viewer compared to brown textured shrub at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is in front of brown textured shrub at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8fcdd31599fa87b7.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the brushed metal sign at upper left? Select from: (A) black cotton shirt at center (B) black matte shirt at center" }, { "from": "gpt", "value": "(A) black cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70e50a450fcdaeab.jpg", "conversations": [ { "from": "human", "value": "\nIs silhouette group at center further to the viewer compared to dark blue jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/890413d11cf3be4f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.315, 0.733) (B) (0.930, 0.416) (C) (0.549, 0.345)" }, { "from": "gpt", "value": "(C) (0.549, 0.345)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e474de24130f1259.jpg", "conversations": [ { "from": "human", "value": "\nIs purple lace fabric at lower right to the right of wooden table at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find purple lace fabric at lower right to the right of wooden table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8becd0b2f4c07b9c.jpg", "conversations": [ { "from": "human", "value": "\nDoes knitted scarf at lower left appear on the right side of matte black dress at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, knitted scarf at lower left is to the right of matte black dress at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d9a9c043b5ce453.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.611, 0.853) (B) (0.421, 0.781)" }, { "from": "gpt", "value": "(B) (0.421, 0.781)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/89559366b65203bd.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown woolen scarf at center is positioned to the right of white matte helmet at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find brown woolen scarf at center to the right of white matte helmet at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c14b911dd0b17f8.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) blue cotton shirt at center (B) brushed metal pot at left (C) blue track pants at right (D) white matte plate at center" }, { "from": "gpt", "value": "(D) white matte plate at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8cee735ffbd985a7.jpg", "conversations": [ { "from": "human", "value": "\nWhere is brown wooden bench at left located in relation to wooden bench at center in the image? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bdd1c361de4b7643.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if orange fabric beach chair at center is thinner than matte green deck chair at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, orange fabric beach chair at center has a lesser width compared to matte green deck chair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e3567bf3b000396.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the black matte tablet at center from the following options: (A) matte black tablet at center (B) pink striped dress at center?" }, { "from": "gpt", "value": "(A) matte black tablet at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0df150cb817461ee.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is green leafy tree at left located relative to metallic silver car at lower right? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b81a61df8f0d0fe0.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown leather vest at right appear over matte black and orange vest at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, brown leather vest at right is not above matte black and orange vest at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d4f607d9a7810b7.jpg", "conversations": [ { "from": "human", "value": "\nIs black denim jeans at left further to camera compared to black plastic video camera at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b83f299e2854fbae.jpg", "conversations": [ { "from": "human", "value": "\nIs matte white shirt at center thinner than plaid skirt at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, matte white shirt at center's width is less than plaid skirt at left's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b523e8254fb779c1.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray fabric jacket at center is positioned above red polyester sleeping bag at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, gray fabric jacket at center is above red polyester sleeping bag at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b54959f05e2755a.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of smooth concrete pavement at lower center and light gray fabric at center in the image provided, where is smooth concrete pavement at lower center located with respect to light gray fabric at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/166be280b6143fff.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the bare branches at center among (A) snowy rock mountain range at center (B) silhouette bare branches at left?" }, { "from": "gpt", "value": "(A) snowy rock mountain range at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16842e892c939376.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.215, 0.217) (B) (0.655, 0.402)" }, { "from": "gpt", "value": "(A) (0.215, 0.217)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92668294fd8d1880.jpg", "conversations": [ { "from": "human", "value": "\nIs gray matte jacket at right bigger than green leafy plant at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, gray matte jacket at right is bigger than green leafy plant at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be774eaee8975c52.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is metallic gray pole at center located relative to brown wooden sign at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/80576daff5f90c58.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.099, 0.750) (B) (0.548, 0.912) (C) (0.883, 0.584)" }, { "from": "gpt", "value": "(C) (0.883, 0.584)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fdc8a26728d12c5d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.208, 0.487) (B) (0.382, 0.542) (C) (0.087, 0.512)" }, { "from": "gpt", "value": "(B) (0.382, 0.542)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9e6d655d9540c50f.jpg", "conversations": [ { "from": "human", "value": "\nDoes transparent glass table at center have a lesser width compared to translucent plastic bottle at table left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5b32e5059a08361.jpg", "conversations": [ { "from": "human", "value": "\nDoes camouflage fabric uniform at right have a greater width compared to camouflage fabric flag at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of camouflage fabric uniform at right exceeds that of camouflage fabric flag at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/810abf5017ed5329.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue water at lower center is thinner than matte black van at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, blue water at lower center might be wider than matte black van at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e339bc3e8c82d0d6.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.823, 0.748) (B) (0.438, 0.278) (C) (0.926, 0.431)" }, { "from": "gpt", "value": "(B) (0.438, 0.278)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aaf4262981b02e38.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black hair at center have a lesser width compared to matte black beanie at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, matte black hair at center might be wider than matte black beanie at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ba5c6751b52d28c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) striped fabric shirt at center (B) black cotton shirt at center" }, { "from": "gpt", "value": "(B) black cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d54ba176e4c2673.jpg", "conversations": [ { "from": "human", "value": "\nIs blue glossy minifigure at center to the right of matte plastic minifigure at left from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find blue glossy minifigure at center to the right of matte plastic minifigure at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d7e2afae5a185b6.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) shiny red dress at center (B) white matte shirt at center" }, { "from": "gpt", "value": "(B) white matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04f5d48e0ba31e1b.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of light blue cotton shirt at center and black fabric at upper left in the image provided, where is light blue cotton shirt at center located with respect to black fabric at upper left? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/324276af6a6e5e35.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny black suit at left below yellow printed fabric dress at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, shiny black suit at left is above yellow printed fabric dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/74b0435306789d26.jpg", "conversations": [ { "from": "human", "value": "\nIs blue plaid shorts at center smaller than black plastic bottle at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, blue plaid shorts at center might be larger than black plastic bottle at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/019c8ee235d7df85.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.036, 0.177) (B) (0.368, 0.841) (C) (0.832, 0.875)" }, { "from": "gpt", "value": "(A) (0.036, 0.177)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c3bcc4503f14344.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) weathered wood hut at center (B) smooth wooden structure at center (C) dark brown skin at center, is positioned farthest from the pink fabric at lower right?" }, { "from": "gpt", "value": "(B) smooth wooden structure at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/154abc9594e373b9.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark brown shaggy horse at lower right appear under white matte horse at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, dark brown shaggy horse at lower right is below white matte horse at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c9218e3106effac.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) purple fabric pants at right (B) metallic gate at right (C) black wool coat at center (D) dark blue hoodie at center" }, { "from": "gpt", "value": "(C) black wool coat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/242bd9c87861ffc6.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the green leafy palm tree at upper center? Select from: (A) polished bronze statue at center (B) smooth stone pool at center" }, { "from": "gpt", "value": "(B) smooth stone pool at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/724f6855b0e38b18.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the black metallic microphone at upper center? Choose among these: (A) shiny metallic microphone at upper left (B) green wood drum at left (C) wooden drum at center (D) red leather drum at center" }, { "from": "gpt", "value": "(C) wooden drum at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70479c0c6210c6cc.jpg", "conversations": [ { "from": "human", "value": "\nIs black asphalt driveway at lower center positioned at the back of black matte car at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is in front of black matte car at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ac33240821bd4e87.jpg", "conversations": [ { "from": "human", "value": "\nIs black wrought iron fence at lower center to the right of black fabric baby carriage at lower left from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find black wrought iron fence at lower center to the right of black fabric baby carriage at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2c3910f979d2556.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of white matte t-shirt at center in reference to green fabric shorts at left? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/872b98b1e79ad1ca.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow metallic crane at upper right to the right of yellow metal crane at right from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, yellow metallic crane at upper right is to the right of yellow metal crane at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/25886cd945638d3c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.822, 0.836) (B) (0.272, 0.394)" }, { "from": "gpt", "value": "(B) (0.272, 0.394)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/007a92dfbb92fcd2.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green water at river center is positioned below gray cotton shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4cca754eb7885fc8.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of blue matte hexagonal stool at lower right in relation to orange matte cube at lower center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc2027027c576620.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue jeans at left appear over black leather jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, blue jeans at left is located above black leather jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/20fa5a4e2841b18b.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.628, 0.059) (B) (0.101, 0.637)" }, { "from": "gpt", "value": "(B) (0.101, 0.637)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bcb7aded043449e3.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the yellow fabric dress at center? (A) gray concrete pavement at center (B) dark blue jeans at lower center (C) pink fabric pants at center" }, { "from": "gpt", "value": "(B) dark blue jeans at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a401f6258e10f185.jpg", "conversations": [ { "from": "human", "value": "\nIs brown tiled roofs at center to the left of smooth gray spire at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, brown tiled roofs at center is to the left of smooth gray spire at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7284c5a28b6eb5d9.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) floral fabric dress at center (B) pink striped onesie at right (C) blue cotton shirt at center, is positioned closest to the matte blue pajamas at left?" }, { "from": "gpt", "value": "(C) blue cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/842bb417647c382a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.183, 0.738) (B) (0.988, 0.498)" }, { "from": "gpt", "value": "(A) (0.183, 0.738)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/226f7f8accb90954.jpg", "conversations": [ { "from": "human", "value": "\nIs white glossy exhaust hood at center positioned in front of white marble countertop at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is in front of white marble countertop at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9e6391aa298fb1bf.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow fabric at right below multicolored fabric flag at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8fd1e5cc07baf89a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.612, 0.303) (B) (0.443, 0.459)" }, { "from": "gpt", "value": "(A) (0.612, 0.303)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7df0928a8d257f37.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte white doll at left is positioned below striped cotton towel at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d5f852dbd2c7e4a2.jpg", "conversations": [ { "from": "human", "value": "\nIs cloudy sky at upper center positioned at the back of green leafy mountain at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc251c02a878c8c0.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black phone at center appear on the left side of silver metallic laptop at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, matte black phone at center is positioned on the left side of silver metallic laptop at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8f4fb87133ccd466.jpg", "conversations": [ { "from": "human", "value": "\nIs teal cotton shirt at center to the right of smooth brown hair at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find teal cotton shirt at center to the right of smooth brown hair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a284fbc674c32f3a.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte face mask at left to the right of white matte tank top at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, white matte face mask at left is not on the right side of white matte tank top at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a4815f28e66582d.jpg", "conversations": [ { "from": "human", "value": "\nDoes denim jeans at center have a greater width compared to purple knitted scarf at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9f141140cefc646.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black shirt at center to the left of transparent glass wine glass at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, matte black shirt at center is not to the left of transparent glass wine glass at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ad714e7a9d54f4b.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of green matte t-shirt at center in reference to black matte shirt at left? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a26062ac49ecddc.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the light blue knitted sweater at center-right? Choose from: (A) wooden bench at center (B) smooth concrete bench at center (C) beige concrete pillar at center" }, { "from": "gpt", "value": "(B) smooth concrete bench at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/afe55f1a0ff5f3c6.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) white timber-framed building at center (B) sandy beach at lower left" }, { "from": "gpt", "value": "(A) white timber-framed building at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44eba99ef225a4c4.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) brown stone spire at upper center (B) light blue shirt at center (C) striped fabric dress at lower left" }, { "from": "gpt", "value": "(A) brown stone spire at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a63cbaae00fa03d.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of camouflage uniform at center in reference to camouflage paint helicopter at upper center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c970b0a7aa3eccf1.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.533, 0.595) (B) (0.796, 0.877) (C) (0.927, 0.927)" }, { "from": "gpt", "value": "(C) (0.927, 0.927)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b2cadd6d015344ec.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.435, 0.655) (B) (0.431, 0.598) (C) (0.535, 0.975)" }, { "from": "gpt", "value": "(C) (0.535, 0.975)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8656f55c8b32a5a3.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of smooth gray dome at center in relation to metallic silver car at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a208aa3cb4f4b3cc.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.863, 0.589) (B) (0.447, 0.842) (C) (0.703, 0.306) (D) (0.040, 0.863)" }, { "from": "gpt", "value": "(C) (0.703, 0.306)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e4e7d265650e742f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.822, 0.444) (B) (0.640, 0.397) (C) (0.839, 0.950)" }, { "from": "gpt", "value": "(A) (0.822, 0.444)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f05142b65893757.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green grass at center is positioned above maroon fabric tracksuit at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, green grass at center is positioned over maroon fabric tracksuit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b6566ee51e848470.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.671, 0.681) (B) (0.773, 0.684)" }, { "from": "gpt", "value": "(A) (0.671, 0.681)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8514b01dac577f58.jpg", "conversations": [ { "from": "human", "value": "\nDoes white water at center appear under white glossy ferry at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, white water at center is located below white glossy ferry at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e1f92fc90fb86b31.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is black matte hot air balloon at center located relative to black matte balloon at left? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a89deea6159f7ad1.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of black matte jacket at center and gold metallic glasses at center in the image provided, where is black matte jacket at center located with respect to gold metallic glasses at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00b6d40ca8ad2b1d.jpg", "conversations": [ { "from": "human", "value": "\nDoes clear glass window at center appear on the left side of gold polished statue at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find clear glass window at center to the left of gold polished statue at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73301c097ec0a8b4.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.213, 0.870) (B) (0.266, 0.263) (C) (0.426, 0.433) (D) (0.503, 0.917)" }, { "from": "gpt", "value": "(D) (0.503, 0.917)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e791d0d885ada9d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white misty waterfall at center is thinner than weathered wood sign at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, white misty waterfall at center's width is not less than weathered wood sign at lower center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01d42eec2575fac9.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.930, 0.641) (B) (0.545, 0.769)" }, { "from": "gpt", "value": "(B) (0.545, 0.769)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f978f573109117e2.jpg", "conversations": [ { "from": "human", "value": "\nIs blue metallic station wagon at center smaller than white plastic license plate at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, blue metallic station wagon at center is not smaller than white plastic license plate at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e9bdae04e165b714.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.117, 0.728) (B) (0.480, 0.309)" }, { "from": "gpt", "value": "(A) (0.117, 0.728)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d8ed23d575b6017a.jpg", "conversations": [ { "from": "human", "value": "\nIs gray shingles cvs/pharmacy at center wider than silver metallic sedan at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, gray shingles cvs/pharmacy at center is wider than silver metallic sedan at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bfe5359ad0ba94ef.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the polished bronze statue at center? Choose from: (A) bronze statue at center (B) slate gray stone pillar at center" }, { "from": "gpt", "value": "(B) slate gray stone pillar at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e56c2be14b2a24af.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if wooden planks at lower right is smaller than smooth skin boy at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, wooden planks at lower right is not smaller than smooth skin boy at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f2e93073eca5ad1.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) wooden canoe at lower right (B) blue smooth water at center" }, { "from": "gpt", "value": "(B) blue smooth water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d7d42288b6bfa68c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue plastic board at center is positioned to the left of black matte tank top at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, blue plastic board at center is not to the left of black matte tank top at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5268e8fa145c0708.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) plaid fabric dress at center (B) black matte book at center (C) black matte tank top at left" }, { "from": "gpt", "value": "(C) black matte tank top at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95e71dbe693ce934.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the glossy plastic gumballs at center? Select from: (A) green translucent gummy rings at center (B) translucent jelly beans at right (C) translucent jelly beans at center" }, { "from": "gpt", "value": "(C) translucent jelly beans at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e98d275f3dee4796.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if speckled feathered chick at center-right is smaller than speckled feathered chick at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, speckled feathered chick at center-right is not smaller than speckled feathered chick at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/21249aa195ccb4b5.jpg", "conversations": [ { "from": "human", "value": "\nDoes pink fabric dress at upper left appear under white plastic table at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, pink fabric dress at upper left is not below white plastic table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/102490f9af8283b5.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) white matte shirt at center (B) red fabric shirt at center (C) blue cotton shirt at upper left" }, { "from": "gpt", "value": "(B) red fabric shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3f1c70d634f53fda.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) bare wood tree at center (B) brown grass at center (C) green matte tree at left (D) brown matte tree at left" }, { "from": "gpt", "value": "(C) green matte tree at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ead297268d139fe.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of white matte dress at center in relation to green cotton shirt at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a9d720c61830b335.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) white woven hat at center (B) green matte military vehicle at center (C) white cotton pants at lower left" }, { "from": "gpt", "value": "(C) white cotton pants at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b85eb221cb0d0e14.jpg", "conversations": [ { "from": "human", "value": "\nIs matte white dress at center to the left of light pink fabric dress at lower right from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find matte white dress at center to the left of light pink fabric dress at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd50297159cd55b7.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of white cotton shirt at center in reference to white cotton tote bag at center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b80f6ac36c0a4179.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden at center to the right of white cotton dress at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, wooden at center is positioned on the right side of white cotton dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e47999e17578c723.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) green leafy hillside at right (B) green leafy tree at lower center (C) dark blue water at center" }, { "from": "gpt", "value": "(A) green leafy hillside at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9a4080d0f602c4da.jpg", "conversations": [ { "from": "human", "value": "\nIs brown leather jacket at center closer to camera compared to green fabric shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, brown leather jacket at center is in front of green fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d9ebabab66808e1.jpg", "conversations": [ { "from": "human", "value": "\nIs blue plastic basket at center below matte brown shellfish at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, blue plastic basket at center is not below matte brown shellfish at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07cc9b5a72fbcf04.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) purple fabric leggings at center (B) red matte sweatshirt at center (C) green fabric shorts at left" }, { "from": "gpt", "value": "(A) purple fabric leggings at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/551680dbf8cfa5a3.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the clear crystal cup at center? (A) crystal clear wine glass at center (B) clear crystal wine glass at center (C) clear crystal shot glass at center" }, { "from": "gpt", "value": "(B) clear crystal wine glass at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/204a655baf3c1fa5.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the orange fabric jacket at center? Choose among these: (A) orange matte jacket at center (B) dried mud road at center (C) matte orange jacket at center" }, { "from": "gpt", "value": "(A) orange matte jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/728095ab206c42d9.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white glossy tour bus at center is positioned to the right of light gray fabric pants at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find white glossy tour bus at center to the right of light gray fabric pants at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a3eaf46682d8dc48.jpg", "conversations": [ { "from": "human", "value": "\nDoes light brown wooden table at center lie behind wooden chair at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02377993ae75e1c8.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) brick paved walkway at center (B) brushed metal boat at center (C) matte concrete water at left" }, { "from": "gpt", "value": "(B) brushed metal boat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/19d06db28296c9a5.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) golden matte wheat field at center (B) white fluffy cloud at upper center" }, { "from": "gpt", "value": "(A) golden matte wheat field at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e8a8744d5b58579.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is green mossy water at center located relative to green mossy wood stairs at lower right? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e1cb5fd0fa47ad4.jpg", "conversations": [ { "from": "human", "value": "\nIs brown wooden fence at center positioned in front of purple matte jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e56561625103965d.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of wooden desk at center less distant than that of matte black sweater at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b75da4d938db4585.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.480, 0.998) (B) (0.824, 0.477) (C) (0.897, 0.131) (D) (0.530, 0.642)" }, { "from": "gpt", "value": "(C) (0.897, 0.131)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed6b7f7db5f2b589.jpg", "conversations": [ { "from": "human", "value": "\nIs spotted fur dog at center smaller than brown rough bark at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, spotted fur dog at center occupies less space than brown rough bark at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/339e996179d8c576.jpg", "conversations": [ { "from": "human", "value": "\nDoes light brown fabric hat at center have a smaller size compared to brown woven basket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cac42850e89e6750.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the matte bronze statue at center? Choose among these: (A) green patina bronze statue at center (B) dark blue jeans at center (C) light blue shirt at lower center" }, { "from": "gpt", "value": "(B) dark blue jeans at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c324ea35f723d26.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) orange matte dump truck at left (B) gray concrete barn at center (C) green leafy hillside at upper center (D) orange matte truck at center" }, { "from": "gpt", "value": "(B) gray concrete barn at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e518c2bda89c7538.jpg", "conversations": [ { "from": "human", "value": "\nIs white smooth shirt at center to the left of yellow plaid shirt at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, white smooth shirt at center is positioned on the left side of yellow plaid shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/19d625e0cb5e6d42.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) white plastic radiator at upper right (B) white fur dog at center" }, { "from": "gpt", "value": "(A) white plastic radiator at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d97876020652deb.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray asphalt pavement at lower left is positioned above light beige pants at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88b2036aa47d7956.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the light yellow fabric shirt at upper left among (A) white cotton shirt at center (B) beige silk shirt at center (C) black plastic microphone at upper right (D) beige silk jacket at center?" }, { "from": "gpt", "value": "(D) beige silk jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d368c19c4dd81fdf.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the white matte jersey at center? Select from: (A) white fabric pants at lower left (B) white matte uniform at center" }, { "from": "gpt", "value": "(B) white matte uniform at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c18c44761e5f114e.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is beige fabric at upper center located relative to white plastic toy at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c8b3f420140594f.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown matte shirt at center appear under brown dirt track at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, brown matte shirt at center is not positioned below brown dirt track at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49f3463a0b7d86ac.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black bottle at center appear on the right side of dark glass bottle at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, matte black bottle at center is not to the right of dark glass bottle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/adba09f28a6ff7ea.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if metallic black keyboard at center is positioned below yellow fabric at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/674030915ffae243.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of dark gray fabric pants at upper center in relation to matte gray shoe at lower center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fdb598967fefaef1.jpg", "conversations": [ { "from": "human", "value": "\nDoes smooth bark tree at center have a lesser width compared to dark skin/white cloth skirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, smooth bark tree at center is not thinner than dark skin/white cloth skirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/87f853989f9301a7.jpg", "conversations": [ { "from": "human", "value": "\nIs soft plush toy at center positioned at the back of matte pink sweater at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is in front of matte pink sweater at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/32b17c6c01f179cf.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) white matte climbing pants at center (B) rusty granite hillside at center (C) green leafy tree at upper right" }, { "from": "gpt", "value": "(A) white matte climbing pants at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2040b1b3c89349d.jpg", "conversations": [ { "from": "human", "value": "\nIs pink satin dress at center to the right of brown matte food at lower center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find pink satin dress at center to the right of brown matte food at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ec9d112ad6122a8.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the matte black suit at center? (A) red silk tie at center (B) white cotton shirt at center (C) matte black hair at center (D) polka dot fabric jacket at left" }, { "from": "gpt", "value": "(B) white cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f457c14846040357.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) white snow at center (B) green matte tree at upper center, is positioned farthest from the dark green textured tree at upper center?" }, { "from": "gpt", "value": "(B) green matte tree at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc243ef774ca8ee1.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.294, 0.348) (B) (0.744, 0.841) (C) (0.552, 0.820)" }, { "from": "gpt", "value": "(A) (0.294, 0.348)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b44506cd1f7dcd2.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of carved stone sculpture at center more distant than that of polished brass lantern at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8653c5073c47df6f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) silk fabric woman at center (B) dark gray matte horse at center (C) gold textured armor at center" }, { "from": "gpt", "value": "(C) gold textured armor at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/18195aa34e68fd48.jpg", "conversations": [ { "from": "human", "value": "\nDoes green matte christmas tree at center have a larger size compared to dark brown leather jacket at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, green matte christmas tree at center is bigger than dark brown leather jacket at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2a3c6ea67f975337.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if natural stone path at center is wider than green leafy tree at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a011726be56334b3.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the clear glass plate at center from the following options: (A) white creamy cake at center (B) golden fried chicken at left?" }, { "from": "gpt", "value": "(B) golden fried chicken at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d55889151c1b9581.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of blue matte bicycle at center and black rubber tire at lower right in the image provided, where is blue matte bicycle at center located with respect to black rubber tire at lower right? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8507ff56a58d7f6c.jpg", "conversations": [ { "from": "human", "value": "\nDoes teal fabric pillow at upper left have a lesser width compared to sparkly blue skirt at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, teal fabric pillow at upper left is not thinner than sparkly blue skirt at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8fe1e8e5d83fb8ff.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the gray stone column at lower center among (A) white glossy clock at center (B) gray stone column at lower left (C) white marble column at center (D) white marble column at lower center?" }, { "from": "gpt", "value": "(B) gray stone column at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/59c7ec88c3ab2ee6.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the knit sweater at center? (A) knitted gray polo neck at center (B) blue fabric curtain at upper left" }, { "from": "gpt", "value": "(A) knitted gray polo neck at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/497a93b005693900.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is white smooth tower at center located relative to satin blue sedan at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f8cc2cdaadce58d.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) white matte shirt at center (B) gray fabric shirt at lower left (C) white textured shirt at center (D) red fabric shirt at right" }, { "from": "gpt", "value": "(B) gray fabric shirt at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d551e48c43f426e.jpg", "conversations": [ { "from": "human", "value": "\nIs weathered wood sign at left to the left of wooden at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, weathered wood sign at left is to the left of wooden at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/245962918afd6561.jpg", "conversations": [ { "from": "human", "value": "\nIs black leather collar at left thinner than leather/camel at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, black leather collar at left is not thinner than leather/camel at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/087467a0d944e07a.jpg", "conversations": [ { "from": "human", "value": "\nIs black glossy dresser at left positioned in front of floral fabric dress at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, black glossy dresser at left is further to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/300b3c6531eeb10d.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.537, 0.778) (B) (0.272, 0.892) (C) (0.780, 0.841) (D) (0.416, 0.792)" }, { "from": "gpt", "value": "(C) (0.780, 0.841)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/31244292976eead5.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray curly hair at upper right appear on the right side of black shirt at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, gray curly hair at upper right is not to the right of black shirt at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d7999360502ec987.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden water at center above green textured stone wall at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0de3ee9e2aae3750.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the blue fabric tent at center? (A) dark blue synthetic backpack at center (B) brown canvas uniform at center" }, { "from": "gpt", "value": "(A) dark blue synthetic backpack at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2274a906138bde08.jpg", "conversations": [ { "from": "human", "value": "\nIs brown glossy harness at center bigger than matte brown dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e4c67f1cd10a64d1.jpg", "conversations": [ { "from": "human", "value": "\nDoes metallic blue car at center appear over blue glossy sedan at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, metallic blue car at center is located above blue glossy sedan at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d7657afdc3684ce.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the white glossy building at center? Choose among these: (A) white glass building at upper center (B) dark blue water at left" }, { "from": "gpt", "value": "(B) dark blue water at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02ef10881655346a.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is matte skin man at center located relative to brown skin man at center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c7e978f3855aebc.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) white matte horse at lower right (B) white glossy horse at lower right (C) smooth red shed at center" }, { "from": "gpt", "value": "(C) smooth red shed at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6fa233b3207355ec.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) blue glass building at center (B) green needle-like tree at left (C) blue glass water at center" }, { "from": "gpt", "value": "(B) green needle-like tree at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9cb5d7cd808f65e.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at center have a lesser width compared to green metal gate at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, green leafy tree at center's width is not less than green metal gate at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d88bdfbfa120422.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) smooth bark tree at center (B) white plastic sign at center, is positioned farthest from the wooden signpost at center?" }, { "from": "gpt", "value": "(A) smooth bark tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/170bf91ac346dfdd.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.548, 0.261) (B) (0.504, 0.317)" }, { "from": "gpt", "value": "(A) (0.548, 0.261)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fedf28edf1d4e724.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of dirt path at center and polished marble obelisk at center in the image provided, where is dirt path at center located with respect to polished marble obelisk at center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/74b1e2b9845811ce.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the brown matte hair at upper center? Select from: (A) dark green ribbed sweater at center (B) denim jeans at center" }, { "from": "gpt", "value": "(B) denim jeans at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/970249fbb868f6e0.jpg", "conversations": [ { "from": "human", "value": "\nDoes green matte tree at center appear on the left side of brown dirt track at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, green matte tree at center is to the right of brown dirt track at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e5c4ada90019fe0c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.661, 0.775) (B) (0.483, 0.527) (C) (0.302, 0.827)" }, { "from": "gpt", "value": "(C) (0.302, 0.827)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bbf876434633dd33.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) terracotta tiles at center (B) brown tiled roof at lower right" }, { "from": "gpt", "value": "(B) brown tiled roof at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/608a9b0dfdf0a5e4.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark green leafy tree at right is positioned to the left of purple dirt track at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, dark green leafy tree at right is not to the left of purple dirt track at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/38a29a2b08ad3603.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte orange car at lower center appear on the left side of dark blue dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find matte orange car at lower center to the left of dark blue dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dfe3bc4808f53593.jpg", "conversations": [ { "from": "human", "value": "\nIs brown brick houses at upper left closer to the viewer compared to white corrugated metal roof at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0a86c486299b036.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) white matte hand at center (B) smooth skin hand at center (C) white paper sign at center right (D) white cotton shirt at center" }, { "from": "gpt", "value": "(D) white cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a626efcce4f0d9e4.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the black fabric at lower center? Select from: (A) floral fabric guitar at center (B) zebra-patterned shirt at center" }, { "from": "gpt", "value": "(A) floral fabric guitar at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9003d209d35a589a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.600, 0.802) (B) (0.709, 0.388)" }, { "from": "gpt", "value": "(B) (0.709, 0.388)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7884bde177eb24d6.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) blue denim shirt at lower center (B) green matte sweater at upper center (C) white matte car at center (D) silver metallic car at left" }, { "from": "gpt", "value": "(A) blue denim shirt at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2536511dad46a24c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.433, 0.700) (B) (0.642, 0.456)" }, { "from": "gpt", "value": "(A) (0.433, 0.700)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1469a5fe6c8e062c.jpg", "conversations": [ { "from": "human", "value": "\nIs dark brown bark at right below black smooth tree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, dark brown bark at right is positioned under black smooth tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2557be6dd6b972f3.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) white soft pillow at center (B) smooth skin baby at center" }, { "from": "gpt", "value": "(B) smooth skin baby at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6848ac2f433bf457.jpg", "conversations": [ { "from": "human", "value": "\nDoes transparent glass window at center have a smaller size compared to black granite sink at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e7bb86a6db7a6aac.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if red striped polo shirt at center is positioned below white jersey at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, red striped polo shirt at center is located below white jersey at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4fc5c34e41b287fb.jpg", "conversations": [ { "from": "human", "value": "\nIs white lace dress at center thinner than white sheer veil at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, white lace dress at center is not thinner than white sheer veil at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5785755c2b4cc79a.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.695, 0.561) (B) (0.328, 0.494)" }, { "from": "gpt", "value": "(B) (0.328, 0.494)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6e049380ea3dc3c.jpg", "conversations": [ { "from": "human", "value": "\nDoes illuminated glass christmas lights at center have a larger size compared to dark brown coat at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, illuminated glass christmas lights at center is not larger than dark brown coat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/044537e2123183b8.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of snowy rocky mountain at upper left and pink fabric at right in the image provided, where is snowy rocky mountain at upper left located with respect to pink fabric at right? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e65590ce66a0d4e1.jpg", "conversations": [ { "from": "human", "value": "\nDoes black fabric shirt at center come in front of black fur puppy at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9eeeba73eb9b3232.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.705, 0.259) (B) (0.837, 0.719) (C) (0.195, 0.320)" }, { "from": "gpt", "value": "(A) (0.705, 0.259)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f10bfa50755457ad.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.950, 0.327) (B) (0.097, 0.847) (C) (0.510, 0.169)" }, { "from": "gpt", "value": "(B) (0.097, 0.847)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ddc8a67b7b92bd86.jpg", "conversations": [ { "from": "human", "value": "\nDoes pink flesh-toned foot at lower right appear on the left side of pink flesh at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, pink flesh-toned foot at lower right is not to the left of pink flesh at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4321720654c82fed.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is cloudy sky at upper center located relative to white fluffy cloud at upper left? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dcb6ffd48bd1e697.jpg", "conversations": [ { "from": "human", "value": "\nDoes teal knitted sweater at center appear on the left side of turquoise knitted sweater at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find teal knitted sweater at center to the left of turquoise knitted sweater at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/55718fce66e9c889.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) light blue button-down shirt at center (B) brown floral dress at left" }, { "from": "gpt", "value": "(B) brown floral dress at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02b136c4faf5b927.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if smooth sand at center is wider than white matte shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, smooth sand at center has a greater width compared to white matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/09a40ce670cfecfc.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown tile roof at center appear on the right side of brown tile roof at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, brown tile roof at center is to the left of brown tile roof at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3af9668de6a751cc.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte white mask at center have a larger size compared to white matte skull at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d264844e185b4bbd.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.694, 0.878) (B) (0.740, 0.822)" }, { "from": "gpt", "value": "(B) (0.740, 0.822)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e72d9830e1f564f.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.160, 0.552) (B) (0.273, 0.236)" }, { "from": "gpt", "value": "(A) (0.160, 0.552)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7dbe5551fb5d537e.jpg", "conversations": [ { "from": "human", "value": "\nIs green water at lower left to the right of wooden ship at right from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, green water at lower left is not on the right side of wooden ship at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f8b3e5426c454bf.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.371, 0.469) (B) (0.558, 0.681) (C) (0.715, 0.956)" }, { "from": "gpt", "value": "(B) (0.558, 0.681)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/26929d563a28add6.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray ice at center have a larger size compared to snow-covered trees at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, gray ice at center is not larger than snow-covered trees at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1622867ffe3fe725.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.291, 0.817) (B) (0.413, 0.197)" }, { "from": "gpt", "value": "(A) (0.291, 0.817)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d27352116ebfa754.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray suit at center have a smaller size compared to gray matte suit at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, gray suit at center might be larger than gray matte suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4dfae6d414c88de8.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) matte gray bird at upper center (B) matte gray bird at lower right" }, { "from": "gpt", "value": "(A) matte gray bird at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f192e5881b37ab51.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of rainbow paint face at center in relation to blue matte face paint at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd594c372cc84727.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) dark blue textured suit at center (B) dark blue textured tie at center" }, { "from": "gpt", "value": "(B) dark blue textured tie at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c88275c9d30c0ef5.jpg", "conversations": [ { "from": "human", "value": "\nIs matte gray shirt at right below light beige shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, matte gray shirt at right is not positioned below light beige shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f2b325de526a4eda.jpg", "conversations": [ { "from": "human", "value": "\nDoes yellow matte t-shirt at lower left come behind orange fabric purse at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4c4ed1db8d5cbcf9.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of matte black television at center in relation to puffy brown jacket at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/62a272ceb79e5ffa.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray concrete wall at left is thinner than silver metallic trailer truck at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, gray concrete wall at left's width is not less than silver metallic trailer truck at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/14e3295fa60b1350.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the green matte bicycle at center among (A) green matte bicycle at left (B) cobblestone pavement at center?" }, { "from": "gpt", "value": "(A) green matte bicycle at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/45f486457ef512ca.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown grass at center have a larger size compared to blue cotton polo shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, brown grass at center might be smaller than blue cotton polo shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c93e39ef45e59dd7.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte cap at center wider than white cotton shirt at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, black matte cap at center is not wider than white cotton shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eff6783b3c3d22d7.jpg", "conversations": [ { "from": "human", "value": "\nDoes clear blue water at wave center come behind smooth blue wave at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, clear blue water at wave center is in front of smooth blue wave at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01aa341cc4924e9f.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny red fabric doll at center positioned before velvet-like maroon cape at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, shiny red fabric doll at center is in front of velvet-like maroon cape at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea039c1bcc1fb0f8.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.093, 0.094) (B) (0.171, 0.787)" }, { "from": "gpt", "value": "(A) (0.093, 0.094)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea197cb48e5d4c74.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the pink checkered shirt at right among (A) matte green scrubs at center (B) gray fabric shirt at center (C) white cotton socks at lower right?" }, { "from": "gpt", "value": "(C) white cotton socks at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8b9573d2f0a2689.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.651, 0.597) (B) (0.648, 0.294)" }, { "from": "gpt", "value": "(A) (0.651, 0.597)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b64025b162dd328.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) shiny blue sedan at center (B) glossy metallic car at center" }, { "from": "gpt", "value": "(B) glossy metallic car at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f82bcc481298388.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.598, 0.570) (B) (0.604, 0.414)" }, { "from": "gpt", "value": "(B) (0.604, 0.414)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/50c819194d1a07f1.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown sandy beach at lower left appear on the left side of green fabric shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, brown sandy beach at lower left is positioned on the left side of green fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aab529670c28761d.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the white fleece jacket at center? Choose among these: (A) light blue fabric vest at center (B) black metal pole at center" }, { "from": "gpt", "value": "(B) black metal pole at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d7f71d5c5ad49f7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if rocky mountain at upper center is wider than paved stone path at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, rocky mountain at upper center has a greater width compared to paved stone path at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f85bdb2657552c1c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.479, 0.419) (B) (0.586, 0.406)" }, { "from": "gpt", "value": "(B) (0.586, 0.406)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78426788d4c16642.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown textured tree at center is thinner than wooden park bench at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4e1f1ccff8730677.jpg", "conversations": [ { "from": "human", "value": "\nIs black plastic keyboard at left positioned behind silver metallic phone at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b649e77a8e96008.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.517, 0.755) (B) (0.198, 0.417) (C) (0.377, 0.498)" }, { "from": "gpt", "value": "(C) (0.377, 0.498)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c4f62a70764bde0.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the dark green military uniform at center? Choose among these: (A) black satin dress at left (B) dark gray suit at center (C) white matte dress at center (D) black velvet dress at center" }, { "from": "gpt", "value": "(C) white matte dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37393bfd7e985dae.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) green matte shirt at center (B) matte black laptop at left (C) dark brown suit at center (D) brown textured blazer at center" }, { "from": "gpt", "value": "(D) brown textured blazer at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/106da58245b8b394.jpg", "conversations": [ { "from": "human", "value": "\nWhere is yellow cotton shirt at center located in relation to light blue fabric dress at center in the image? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7971b028dcac1584.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden swing at center to the right of brown wooden swing at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, wooden swing at center is positioned on the right side of brown wooden swing at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6bf88452bf2cc9bd.jpg", "conversations": [ { "from": "human", "value": "\nIs green fabric shirt at center to the right of matte black jacket at right from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, green fabric shirt at center is not to the right of matte black jacket at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b6710ee03ea03acc.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the light gray fabric shirt at center? Select from: (A) metallic silver motorbike at center (B) metallic silver bicycle at right" }, { "from": "gpt", "value": "(A) metallic silver motorbike at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf789f2dd5746432.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white cotton shirt at lower right is positioned above blue jeans at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, white cotton shirt at lower right is not positioned above blue jeans at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e3089e21a7fdcaa.jpg", "conversations": [ { "from": "human", "value": "\nIs metallic yellow rickshaw at center closer to camera compared to matte black coach at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is in front of matte black coach at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/616c92047822f6c0.jpg", "conversations": [ { "from": "human", "value": "\nIs translucent fabric at center to the right of white paper at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, translucent fabric at center is positioned on the right side of white paper at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e4c0afefccbd99df.jpg", "conversations": [ { "from": "human", "value": "\nIs blue tarpaulin at center wider than yellow matte raincoat at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2260e450fac4224e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.455, 0.578) (B) (0.841, 0.722) (C) (0.433, 0.495) (D) (0.669, 0.720)" }, { "from": "gpt", "value": "(C) (0.433, 0.495)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a14c31114789987b.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the clear water at lower left from the following options: (A) white fluffy dog at lower left (B) brown dirt at lower left?" }, { "from": "gpt", "value": "(A) white fluffy dog at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88fb82dc15766930.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the light gray shirt at center? Select from: (A) matte black sunglasses at upper right (B) wooden at center (C) light gray suit at upper right (D) gray wool suit at center" }, { "from": "gpt", "value": "(A) matte black sunglasses at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cb02381b1ad995cb.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the white stone fountain at center? (A) black puffy jacket at left (B) green mossy stone fountain at center" }, { "from": "gpt", "value": "(A) black puffy jacket at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/793f66634a2d0459.jpg", "conversations": [ { "from": "human", "value": "\nIs weathered brown wood at lower left further to the viewer compared to green wood tree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is in front of green wood tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ac06eb456aec5690.jpg", "conversations": [ { "from": "human", "value": "\nDoes floral fabric dress at center come in front of matte black shirt at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, floral fabric dress at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ee9d8292126a906.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of matte blue dress at center less distant than that of matte blue fabric hand at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, matte blue dress at center is in front of matte blue fabric hand at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a346ec46dc0582eb.jpg", "conversations": [ { "from": "human", "value": "\nDoes green woolen jacket at lower right lie behind white woolly sheep at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6a009fdd8a3413fb.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if glassy silver skyscraper at center is positioned to the right of blue glossy monorail at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, glassy silver skyscraper at center is to the right of blue glossy monorail at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2809f0f400521b86.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.305, 0.819) (B) (0.234, 0.073) (C) (0.492, 0.381)" }, { "from": "gpt", "value": "(A) (0.305, 0.819)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8dff842f0172fcb.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) clear glass window at upper left (B) white marble statue at center (C) clear crystal chandelier at upper left" }, { "from": "gpt", "value": "(A) clear glass window at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/96d15c5129e72222.jpg", "conversations": [ { "from": "human", "value": "\nIs charcoal gray stone fireplace at right wider than gray matte sweater at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a6c7e06c17e3cea8.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) rusty stone castle at center (B) white plastic boat at lower center" }, { "from": "gpt", "value": "(B) white plastic boat at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02f0cd420e803ad0.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) black glossy dog at center (B) clear ice at center" }, { "from": "gpt", "value": "(A) black glossy dog at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d4cfd7de7d3cf07e.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) matte black suit at center (B) black matte jacket at center" }, { "from": "gpt", "value": "(B) black matte jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23749bf5fa25632d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray cotton t-shirt at center is positioned below white shirt at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, gray cotton t-shirt at center is located below white shirt at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/42674313e6dbd86f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.951, 0.391) (B) (0.775, 0.641) (C) (0.878, 0.369)" }, { "from": "gpt", "value": "(C) (0.878, 0.369)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/baaca1309c67f4da.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the white soft paw at lower left? (A) black matte paw at lower center (B) black shiny dog at center" }, { "from": "gpt", "value": "(A) black matte paw at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be744da9eab166a2.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the blue water at upper left among (A) curly orange hair at center (B) gray matte hair at center (C) striped cotton shirt at center?" }, { "from": "gpt", "value": "(A) curly orange hair at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0c164b932215801.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the dark blue sweater at center? Select from: (A) black leather jacket at center (B) matte black jacket at center (C) silver metallic train at center" }, { "from": "gpt", "value": "(A) black leather jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/125e8a0e72071fc1.jpg", "conversations": [ { "from": "human", "value": "\nIs red fabric umbrella at center bigger than multicolored balloons at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/24d8b566a4462ef4.jpg", "conversations": [ { "from": "human", "value": "\nIs matte red sweater at center thinner than blonde hair at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37ef75e12ab385a8.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the metallic digital clock at center among (A) dark blue suit at center (B) dark brown leather jacket at center?" }, { "from": "gpt", "value": "(B) dark brown leather jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d092e7c67640bc24.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) rocky stone structure at center (B) rustic stone mountain at upper center" }, { "from": "gpt", "value": "(A) rocky stone structure at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/087323220d989aa0.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.508, 0.662) (B) (0.648, 0.547) (C) (0.408, 0.838) (D) (0.140, 0.720)" }, { "from": "gpt", "value": "(C) (0.408, 0.838)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/013f54b09713e516.jpg", "conversations": [ { "from": "human", "value": "\nIs gold polished statue at center smaller than dark brown fabric pants at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, gold polished statue at center occupies less space than dark brown fabric pants at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/47e01a905b08fff7.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of dark blue hard hat at center in reference to gray fabric shirt at lower left? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/393a1ffbee10bda8.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden houseboat at left positioned behind white matte boat at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, wooden houseboat at left is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d699211c7f395667.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass at center above green canvas tent at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, green grass at center is not above green canvas tent at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f7c6cdcaa997c4a.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the snowy rock mountain at upper right among (A) dark gray fabric bicycle at center (B) silver metallic mountain bike at center (C) rugged stone terrain at center?" }, { "from": "gpt", "value": "(C) rugged stone terrain at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/72a4f3e2529ba838.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the white cotton shirt at center? Choose among these: (A) dark gray pants at left (B) matte black microphone at left (C) checkered fabric shirt at center" }, { "from": "gpt", "value": "(C) checkered fabric shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b74b6e2e3eda6e4.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) gray fabric suit at left (B) white shirt at center, is positioned farthest from the black leather coat at center?" }, { "from": "gpt", "value": "(A) gray fabric suit at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f8b4757d16c40b1.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) gold glass building at center (B) white frothy water at lower left" }, { "from": "gpt", "value": "(B) white frothy water at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9479bef9ae85e1a0.jpg", "conversations": [ { "from": "human", "value": "\nDoes shiny silver fish at upper left appear on the right side of shiny silver fish at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, shiny silver fish at upper left is not to the right of shiny silver fish at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bceffe11d14e6f2e.jpg", "conversations": [ { "from": "human", "value": "\nIs white glass building at left thinner than beige textured building at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, white glass building at left is not thinner than beige textured building at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/369cfeb78052c6df.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) black fabric uniform at center (B) navy blue fabric uniform at center, is positioned closest to the metallic gray ship at upper right?" }, { "from": "gpt", "value": "(B) navy blue fabric uniform at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/20c91ef3f82735d9.jpg", "conversations": [ { "from": "human", "value": "\nDoes shiny blue water at center have a larger size compared to dark green leafy branch at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, shiny blue water at center might be smaller than dark green leafy branch at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/800d84503169d769.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if light blue cotton pants at right is thinner than white cotton pants at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, light blue cotton pants at right has a lesser width compared to white cotton pants at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f2f94594503cbb7b.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the dark hair at right? Select from: (A) yellow digital sign at center (B) yellow digital display at center (C) dark brown hair at center (D) yellow digital sign at upper left" }, { "from": "gpt", "value": "(D) yellow digital sign at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a4fa34c9073f249.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the gray/granite rock at center? Select from: (A) pink dotted cardigan at center (B) gray wool sweater at center" }, { "from": "gpt", "value": "(B) gray wool sweater at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e9f35aeb7bd0981a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.327, 0.895) (B) (0.873, 0.694)" }, { "from": "gpt", "value": "(B) (0.873, 0.694)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1511e82422eb6948.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white glossy train at center is positioned to the right of dark purple fabric shirt at center-right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, white glossy train at center is not to the right of dark purple fabric shirt at center-right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6816f0e8b0b28c3c.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) pink matte shirt at center (B) shiny black sunglasses at upper right" }, { "from": "gpt", "value": "(B) shiny black sunglasses at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc8383fc1efea523.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.887, 0.478) (B) (0.564, 0.848) (C) (0.143, 0.742)" }, { "from": "gpt", "value": "(C) (0.143, 0.742)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d04edf6dbd65298.jpg", "conversations": [ { "from": "human", "value": "\nDoes purple matte smoothie at right appear on the right side of smooth white milkshake at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find purple matte smoothie at right to the right of smooth white milkshake at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0773295181aef54.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) white matte laptop at lower left (B) black textured scarf at center (C) matte gray sweater at center (D) matte black shirt at center" }, { "from": "gpt", "value": "(C) matte gray sweater at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5db7fedaf213f586.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue plastic sign at center is positioned to the right of white glossy car at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, blue plastic sign at center is not on the right side of white glossy car at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c0315e5da3c4758.jpg", "conversations": [ { "from": "human", "value": "\nDoes orange lace top at left appear on the left side of orange lace tank top at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, orange lace top at left is to the left of orange lace tank top at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0939f001edc5cce.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at center appear on the left side of white matte dome at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find green leafy tree at center to the left of white matte dome at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/879cff38dc4ad69e.jpg", "conversations": [ { "from": "human", "value": "\nDoes soft yellow plush toy at center appear on the left side of blue matte pole at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find soft yellow plush toy at center to the left of blue matte pole at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46620e66f1287fd5.jpg", "conversations": [ { "from": "human", "value": "\nDoes black fur coat at left have a lesser width compared to black plastic sunglasses at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, black fur coat at left is not thinner than black plastic sunglasses at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/52c9d51cdcf0847a.jpg", "conversations": [ { "from": "human", "value": "\nDoes striped sweater at left appear on the right side of wooden at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, striped sweater at left is to the left of wooden at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7fc4bdfbf81f890e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black matte motorcycle at center is positioned above metallic maroon sedan at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, black matte motorcycle at center is above metallic maroon sedan at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1fcdb8677d944b98.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black fuzzy socks at center is positioned above matte black socks with pink dots at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c6447f2e03db08e.jpg", "conversations": [ { "from": "human", "value": "\nIs white fabric table at center closer to camera compared to white tablecloth at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3ba845ada778cf51.jpg", "conversations": [ { "from": "human", "value": "\nIs dark blue dress at center closer to camera compared to smooth skin hand at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23058f618df3ee35.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) green leafy tree at left (B) clear water at center" }, { "from": "gpt", "value": "(B) clear water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/57cfbc9187a2e7fc.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) brick building at center (B) satin silver sedan at center-right (C) shiny chrome motorcycle at lower left" }, { "from": "gpt", "value": "(C) shiny chrome motorcycle at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/994549cc149123a1.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the white cotton shirt at center among (A) concrete rectangular hole at center (B) black matte crack at lower center?" }, { "from": "gpt", "value": "(B) black matte crack at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3dd4a99557e03f5a.jpg", "conversations": [ { "from": "human", "value": "\nDoes white cotton shirt at left have a smaller size compared to white cotton shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white cotton shirt at left is not smaller in size than white cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0150b4a6094b27f8.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black shirt at center to the right of floral-patterned fabric dress at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, matte black shirt at center is positioned on the right side of floral-patterned fabric dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/66b215163915c9a6.jpg", "conversations": [ { "from": "human", "value": "\nIs gray rocky mountain at upper center in front of brown rough stone at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3ccdc0d8c3169908.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if smooth concrete stairs at lower center is bigger than black matte speaker at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, smooth concrete stairs at lower center is bigger than black matte speaker at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/933e33622c95c354.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark blue water at lower center come in front of brown stone church at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bb0c66b209b82d1a.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.708, 0.672) (B) (0.539, 0.341)" }, { "from": "gpt", "value": "(A) (0.708, 0.672)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9238d4cf141512fb.jpg", "conversations": [ { "from": "human", "value": "\nIs glossy blue jet ski at center smaller than matte black jet ski at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, glossy blue jet ski at center is not smaller than matte black jet ski at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/581dcd88f16b004e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown soft hoodie at center is smaller than matte black jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, brown soft hoodie at center is smaller than matte black jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/955fa27232b20fae.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the brown wooden tree at upper left? Choose from: (A) green leafy tree at upper right (B) wooden log cabin at center (C) green leafy tree at center" }, { "from": "gpt", "value": "(A) green leafy tree at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70e5b48ca55df6a5.jpg", "conversations": [ { "from": "human", "value": "\nIs metallic silver bike lane at center above teal matte bus at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, metallic silver bike lane at center is below teal matte bus at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a46606efafc26749.jpg", "conversations": [ { "from": "human", "value": "\nDoes yellow dotted sweater at center appear on the left side of brown textured sweater at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, yellow dotted sweater at center is not on the left side of brown textured sweater at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0bc58c2039738784.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny satin dress at left thinner than matte red dress at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, shiny satin dress at left's width is not less than matte red dress at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc07776a4bb7b264.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of smooth concrete pavement at center and green matte shirt at upper left in the image provided, where is smooth concrete pavement at center located with respect to green matte shirt at upper left? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d3e02422bbd326cc.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of green leafy vegetable at center in relation to translucent glass wine at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b2b04b2c33b705bc.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.053, 0.422) (B) (0.632, 0.522)" }, { "from": "gpt", "value": "(A) (0.053, 0.422)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3ee6d836ec8e0980.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.226, 0.373) (B) (0.581, 0.580)" }, { "from": "gpt", "value": "(B) (0.581, 0.580)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5144392deb3f5e79.jpg", "conversations": [ { "from": "human", "value": "\nIs reflective safety vest at center positioned before orange safety vest at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is in front of orange safety vest at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca0e5914a7a5bd76.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) yellow fuzzy coat at upper right (B) dark gray hoodie at lower center (C) dark blue jacket at upper right (D) dark gray jacket at lower left, is positioned closest to the black matte jacket at center?" }, { "from": "gpt", "value": "(C) dark blue jacket at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef3168fbf088ff0e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) green leafy tree at upper right (B) clear water at center (C) green leafy tree at left" }, { "from": "gpt", "value": "(A) green leafy tree at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/041e66dc8170bdff.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) light blue cotton shirt at lower left (B) matte red shirt at center (C) matte red t-shirt at center" }, { "from": "gpt", "value": "(A) light blue cotton shirt at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/66025c98e6e69745.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark gray shirt at center appear on the left side of matte black shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find dark gray shirt at center to the left of matte black shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/931383bddf7dee74.jpg", "conversations": [ { "from": "human", "value": "\nIs purple matte shirt at center thinner than white matte dress at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, purple matte shirt at center's width is not less than white matte dress at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/217416a9c82316b7.jpg", "conversations": [ { "from": "human", "value": "\nIs gray fabric chair at center smaller than transparent glass window at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, gray fabric chair at center occupies less space than transparent glass window at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c4a16e95488d4a4.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the brown dirt track at center? Select from: (A) white matte shirt at center (B) yellow matte building at left (C) rustic wooden hut at center" }, { "from": "gpt", "value": "(B) yellow matte building at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca250a17aff47950.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth rock creek at lower left further to the viewer compared to rusty brown rock at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb9103c108825998.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.493, 0.622) (B) (0.610, 0.787)" }, { "from": "gpt", "value": "(B) (0.610, 0.787)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d51d23d81a3ede34.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the metallic red car at center from the following options: (A) metallic silver car at lower left (B) metallic structure at center?" }, { "from": "gpt", "value": "(B) metallic structure at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/93685a375ea033c8.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte green jacket at left have a larger size compared to olive green hoodie at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte green jacket at left is bigger than olive green hoodie at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e9fe16607b6d6f8.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the white plastic table at center? (A) black matte uniform at upper right (B) black matte uniform at center (C) black smooth uniform at center" }, { "from": "gpt", "value": "(A) black matte uniform at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/09ee9fc97187e755.jpg", "conversations": [ { "from": "human", "value": "\nIs dry straw at lower center positioned before striped fur kitten at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, dry straw at lower center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1012f459e956a0b7.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the matte white book at center? Choose from: (A) woven brown basket at left (B) hardcover book at center" }, { "from": "gpt", "value": "(B) hardcover book at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/96f7e102a249c47a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.312, 0.873) (B) (0.965, 0.089) (C) (0.169, 0.698)" }, { "from": "gpt", "value": "(A) (0.312, 0.873)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70705e42b4d2ae7a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) green leafy tree at center (B) shiny chrome motorcycle at lower right (C) green matte shirt at center" }, { "from": "gpt", "value": "(A) green leafy tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7d2a16b3b4e9c145.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) satin blue dress at center (B) shiny black suit at center" }, { "from": "gpt", "value": "(B) shiny black suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d20566587eb10dd.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.601, 0.461) (B) (0.160, 0.927)" }, { "from": "gpt", "value": "(A) (0.601, 0.461)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cdd940886ca973a7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white matte drum at center is positioned below printed fabric drumstick at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white matte drum at center is not positioned below printed fabric drumstick at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/684e627ed5969485.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) white smooth neck at center (B) white matte bird at center" }, { "from": "gpt", "value": "(B) white matte bird at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/94aa3080e3c3c096.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) gray cotton sweatshirt at center (B) denim at left" }, { "from": "gpt", "value": "(B) denim at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b0d32ca87b80453.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.501, 0.483) (B) (0.533, 0.742)" }, { "from": "gpt", "value": "(A) (0.501, 0.483)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a74f7cdfb3c9a10.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.351, 0.866) (B) (0.071, 0.398) (C) (0.431, 0.942) (D) (0.859, 0.623)" }, { "from": "gpt", "value": "(D) (0.859, 0.623)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/97ea8b27a6b49f78.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden beads necklace at center below matte stone head at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, wooden beads necklace at center is located below matte stone head at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00112e1d6c62af6b.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth blue shirt at center positioned behind yellow matte figure at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, smooth blue shirt at center is further from the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d957664870ddd918.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is brown matte insects at center located relative to matte brown insect at center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/034278c60c8e4229.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of matte brown sweater at center and black matte shirt at center in the image provided, where is matte brown sweater at center located with respect to black matte shirt at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4e3787ec37abf159.jpg", "conversations": [ { "from": "human", "value": "\nWhere is blue cotton saree at right located in relation to maroon sheer shawl at center in the image? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6a1eeac5d99d770a.jpg", "conversations": [ { "from": "human", "value": "\nDoes greenish water at lower left appear on the right side of tan skin man at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, greenish water at lower left is not on the right side of tan skin man at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2701cf620e302f3c.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the blue tie-dye shirt at upper right among (A) curly red hair at lower right (B) blue tie-dye shirt at center (C) blue tie-dye shirt at upper center?" }, { "from": "gpt", "value": "(A) curly red hair at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec6c7f1d5f87b68a.jpg", "conversations": [ { "from": "human", "value": "\nIs cloudy sky at upper center below glossy reflective water at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, cloudy sky at upper center is not positioned below glossy reflective water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c85ca2381b175bf.jpg", "conversations": [ { "from": "human", "value": "\nIs transparent blue water at center below white matte boat at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, transparent blue water at center is positioned under white matte boat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9266228dd31e3328.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) green leafy tree at center (B) green grassy field at center" }, { "from": "gpt", "value": "(A) green leafy tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0585774f37ebb1cc.jpg", "conversations": [ { "from": "human", "value": "\nIs silver metallic train at center thinner than shiny glass tower at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, silver metallic train at center's width is less than shiny glass tower at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7a3dc42aede06a7.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.795, 0.622) (B) (0.418, 0.911) (C) (0.445, 0.825)" }, { "from": "gpt", "value": "(A) (0.795, 0.622)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/832a8f3a6e0ddf85.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if shiny black shell at center is thinner than shiny dark brown bowl at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, shiny black shell at center has a lesser width compared to shiny dark brown bowl at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4339ca280790a9b9.jpg", "conversations": [ { "from": "human", "value": "\nDoes shiny black car at lower left lie in front of metallic silver car at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc65c4642b4802c8.jpg", "conversations": [ { "from": "human", "value": "\nIs brown/camouflage tree at center wider than wooden rifle at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6267a9ae27618125.jpg", "conversations": [ { "from": "human", "value": "\nDoes black matte scuba gear at center come in front of white glossy boat at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0fcb183566afa2c3.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if bronze statue at upper center is positioned to the left of polished stone statue at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, bronze statue at upper center is to the left of polished stone statue at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7028a5a1371b6479.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the black fabric coat at center? (A) shiny metallic bicycle at upper center (B) plaid flannel shirt at center" }, { "from": "gpt", "value": "(B) plaid flannel shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/65e21b580dcff0f4.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown glazed vase at left is positioned to the left of terracotta clay pot at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, brown glazed vase at left is to the left of terracotta clay pot at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7012083ea35f8f7c.jpg", "conversations": [ { "from": "human", "value": "\nDoes smooth skin face at upper right have a lesser width compared to smooth beige baby at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, smooth skin face at upper right is thinner than smooth beige baby at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/daf82e4b6179eb27.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown smooth river at center appear under green plastic boat at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06dff253d23049ee.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the dark gray jacket at lower left? Select from: (A) dark blue jeans at center (B) light brown fabric jacket at lower left (C) red backpack at center" }, { "from": "gpt", "value": "(C) red backpack at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d88def7747956525.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte stone statue at right lie behind shiny black dog at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f830d6c319ffa70e.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) green leafy tree at center (B) brown muddy water at center (C) dirt path at center" }, { "from": "gpt", "value": "(C) dirt path at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d0f983f2f28f0fb.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue beaded necklace at upper center have a larger size compared to blue fabric at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, blue beaded necklace at upper center has a larger size compared to blue fabric at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/56aa41c80350a905.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.059, 0.552) (B) (0.555, 0.431) (C) (0.721, 0.427) (D) (0.766, 0.775)" }, { "from": "gpt", "value": "(C) (0.721, 0.427)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49a603de4b54f768.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.197, 0.834) (B) (0.404, 0.944) (C) (0.363, 0.534)" }, { "from": "gpt", "value": "(B) (0.404, 0.944)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f25d966f91ac0e9e.jpg", "conversations": [ { "from": "human", "value": "\nIs green needle-like tree at lower left further to the viewer compared to green leafy tree at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e989232e7063722.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) white fluffy scrambled eggs at lower left (B) black plastic keyboard at upper left" }, { "from": "gpt", "value": "(B) black plastic keyboard at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f66e25c7391fbe35.jpg", "conversations": [ { "from": "human", "value": "\nDoes natural wood toy at center appear on the right side of natural wood chest at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, natural wood toy at center is positioned on the right side of natural wood chest at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0530fdfdff5bda1b.jpg", "conversations": [ { "from": "human", "value": "\nIs natural wood pallet at upper center wider than natural wood pallet at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/baefb68bf4e8d8f6.jpg", "conversations": [ { "from": "human", "value": "\nIs green textured mountain range at center smaller than green leafy tree at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, green textured mountain range at center might be larger than green leafy tree at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b6f38154a93702eb.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown rough gravel at center lie behind teal matte suv at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is in front of teal matte suv at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/523b88c1044a1a91.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if shiny black fur at right is smaller than white painted wood bench at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, shiny black fur at right might be larger than white painted wood bench at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95c1134d73ef7a31.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) brick textured building at left (B) white textured building at center" }, { "from": "gpt", "value": "(A) brick textured building at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc1929ab9c62e0aa.jpg", "conversations": [ { "from": "human", "value": "\nDoes white cotton pants at center have a greater width compared to blue cotton shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white cotton pants at center is not wider than blue cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e987743ef8a7654.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of dark gray t-shirt at left in reference to white cotton shirt at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92f63e8242436678.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is asphalt road at center located relative to dark blue fabric at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4aa752b128ec765c.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the shiny black sedan at lower left from the following options: (A) gray asphalt parking lot at lower left (B) shiny black sedan at center?" }, { "from": "gpt", "value": "(B) shiny black sedan at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/740123a0644b41d2.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the shiny gold vest at center among (A) satin dress at left (B) pink satin gown at center (C) white satin dress at center (D) purple satin dress at right?" }, { "from": "gpt", "value": "(B) pink satin gown at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9140ec82042140a0.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is matte khaki jeep at center located relative to yellow matte license plate at rear? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0a7bef065055d4e.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) white paper cup at center (B) black matte t-shirt at center (C) sunglasses at center (D) white cotton polo shirt at left" }, { "from": "gpt", "value": "(C) sunglasses at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/11215755b25e226d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if concrete road at center is wider than white plastic circle at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of concrete road at center exceeds that of white plastic circle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2add6caf9497aa7f.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the denim jacket at upper center? Choose from: (A) ribbed knit sweater at left (B) multicolored painted dolls at center" }, { "from": "gpt", "value": "(A) ribbed knit sweater at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/13f68df929b36a2b.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.510, 0.794) (B) (0.298, 0.478)" }, { "from": "gpt", "value": "(B) (0.298, 0.478)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc79d6631cd30d68.jpg", "conversations": [ { "from": "human", "value": "\nDoes concrete sidewalk at center have a larger size compared to floral dress at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06045da85463cddb.jpg", "conversations": [ { "from": "human", "value": "\nIs white fluffy cloud at upper center thinner than brown plastic glasses at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, white fluffy cloud at upper center's width is not less than brown plastic glasses at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e3c23dd5d115018.jpg", "conversations": [ { "from": "human", "value": "\nDoes shiny blue train at upper right lie behind matte blue train at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c8709571f4be188.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue fleece jacket at left is smaller than wooden stairs at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, blue fleece jacket at left has a smaller size compared to wooden stairs at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6cfea3b8058c30c6.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.710, 0.416) (B) (0.706, 0.378)" }, { "from": "gpt", "value": "(A) (0.710, 0.416)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba1b23f79663f810.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the gray concrete skyscraper at right? (A) matte glass building at center (B) glossy glass skyscraper at center (C) glossy glass tower at center (D) black glass building at center" }, { "from": "gpt", "value": "(A) matte glass building at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eca9576a94442a19.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white matte snow at center is positioned to the left of matte red vest at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find white matte snow at center to the left of matte red vest at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1db65b4849b4e70.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green grass at center is smaller than matte red baseball caps at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, green grass at center occupies less space than matte red baseball caps at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fa355f1183205f9d.jpg", "conversations": [ { "from": "human", "value": "\nIs purple translucent cup at center closer to camera compared to wooden picnic table at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/af81ab46e2bade23.jpg", "conversations": [ { "from": "human", "value": "\nIs brown muddy water at center behind green mossy tree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, brown muddy water at center is behind green mossy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5cc60ab6d03b804b.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the blue fabric shirt at center? (A) white glossy car at lower right (B) beige matte bus at center" }, { "from": "gpt", "value": "(A) white glossy car at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d4eef248a3746eb.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.501, 0.769) (B) (0.885, 0.119)" }, { "from": "gpt", "value": "(A) (0.501, 0.769)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ba4f635ab49afaf.jpg", "conversations": [ { "from": "human", "value": "\nIs transparent glass street light at center to the right of polished glass pole at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, transparent glass street light at center is to the left of polished glass pole at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d93c0c3091de8561.jpg", "conversations": [ { "from": "human", "value": "\nIs red fleece sweatshirt at center to the left of gray matte shirt at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, red fleece sweatshirt at center is to the right of gray matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/96e143024d602fa5.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) transparent water at center (B) matte pink flamingo at center" }, { "from": "gpt", "value": "(A) transparent water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bcf4b085fb145f29.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the striped cotton shirt at center? Choose from: (A) brown fabric baseball cap at upper left (B) brown cap at center (C) bearded man at center" }, { "from": "gpt", "value": "(B) brown cap at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/31c62373dcaf3a97.jpg", "conversations": [ { "from": "human", "value": "\nDoes white dotted shirt at center have a larger size compared to green fabric tent at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, white dotted shirt at center might be smaller than green fabric tent at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/088368b5b1e7149e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if shiny blue car at center is smaller than light brown leather jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, shiny blue car at center might be larger than light brown leather jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c792dd354907e6c4.jpg", "conversations": [ { "from": "human", "value": "\nDoes black pinstripe suit at center have a larger size compared to black satin bow tie at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, black pinstripe suit at center is larger in size than black satin bow tie at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1696241b8916df8.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) steampunk-patterned book cover at right (B) matte paper book cover at center" }, { "from": "gpt", "value": "(B) matte paper book cover at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/341b0abe30cdb2da.jpg", "conversations": [ { "from": "human", "value": "\nIs white cotton bath towel at upper center to the right of white soft towel at left from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, white cotton bath towel at upper center is positioned on the right side of white soft towel at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d73eaaebf13dc60.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) green matte suit at center (B) matte black projector at upper center (C) white matte projector screen at upper center (D) wooden table at lower center, is positioned farthest from the metallic silver table at lower right?" }, { "from": "gpt", "value": "(C) white matte projector screen at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f20dd565fcff5fdd.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray cotton shirt at upper right appear on the right side of pink fabric shirt at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, gray cotton shirt at upper right is positioned on the right side of pink fabric shirt at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5cce24c8f04d4430.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) blue cotton shirt at center (B) matte red canopy at upper left" }, { "from": "gpt", "value": "(B) matte red canopy at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8c0977f149df4f9.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the brown leather seat at center? (A) matte brown chair at center (B) metallic gray seat at center" }, { "from": "gpt", "value": "(B) metallic gray seat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc73aa52675ab25e.jpg", "conversations": [ { "from": "human", "value": "\nDoes white glossy train at center have a lesser width compared to white glossy train at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/39e38da0b9f035f7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green mossy tree at center is bigger than blue fabric backpack at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, green mossy tree at center is not larger than blue fabric backpack at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/269d7ee6e66c16ba.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green matte forest at center is wider than green matte tree at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, green matte forest at center has a greater width compared to green matte tree at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8f0bc124a395e85d.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of brown rough rock at center in relation to shiny black shorts at left? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/89d2be86c652c6a0.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte silver dress at center have a smaller size compared to yellow spandex tights at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, matte silver dress at center is not smaller in size than yellow spandex tights at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82f870fe41db7d73.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if clear water at rock bottom is bigger than gray rough rock at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, clear water at rock bottom has a larger size compared to gray rough rock at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85591f5ebe83bfb6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black glove at upper center is positioned below reflective plastic goggles at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/da2c65582a599a46.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth concrete pavement at lower center positioned at the back of black canvas shoe at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, smooth concrete pavement at lower center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a647fb651187e33c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if shiny red car at right is positioned to the left of white glossy car at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, shiny red car at right is positioned on the left side of white glossy car at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f3c424f832acab9.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) green leafy bush at center (B) green textured bush at lower right (C) green leafy tree at left (D) green leafy bush at lower right" }, { "from": "gpt", "value": "(D) green leafy bush at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc89de367a20f16a.jpg", "conversations": [ { "from": "human", "value": "\nIs white paper sign at center right above black textured lamp post at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, white paper sign at center right is not positioned above black textured lamp post at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3976c1f4092515ae.jpg", "conversations": [ { "from": "human", "value": "\nIs navy blue fleece at center to the left of green leafy hill at upper right from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, navy blue fleece at center is positioned on the left side of green leafy hill at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a387280d3ddff8c3.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if cracked stone head at center is wider than cracked stone face at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of cracked stone head at center exceeds that of cracked stone face at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef984d2b237ef97e.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte khaki shirt at center lie behind black wood bookshelf at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, matte khaki shirt at center is in front of black wood bookshelf at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5c1d8b81c2a2d8f.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of smooth brown rock at center more distant than that of brown matte rock at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e723229a914c8072.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) gold polished spear at center (B) green patina bronze statue at center" }, { "from": "gpt", "value": "(B) green patina bronze statue at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/630326030c5dd634.jpg", "conversations": [ { "from": "human", "value": "\nIs matte purple nail polish at center above satin purple nail polish at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte purple nail polish at center is above satin purple nail polish at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f6576fea029e60da.jpg", "conversations": [ { "from": "human", "value": "\nIs red brick wall at upper right positioned behind reddish-brown brick pillar at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/956102235c0c357a.jpg", "conversations": [ { "from": "human", "value": "\nIs clear water at lower center further to camera compared to red matte swimsuit at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a2fa1c772abd74b.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) shiny satin gloves at upper right (B) pink silky wig at upper left, is positioned farthest from the shiny pink wig at center?" }, { "from": "gpt", "value": "(A) shiny satin gloves at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/660e93d0c3d0e7a8.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if clear blue water at center is thinner than smooth skin girl at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, clear blue water at center is not thinner than smooth skin girl at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4ce2e9b1b0beef25.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.366, 0.383) (B) (0.647, 0.508) (C) (0.618, 0.267)" }, { "from": "gpt", "value": "(B) (0.647, 0.508)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86bbe3a80c1357cb.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black folding chair at left wider than black fabric chair at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of matte black folding chair at left exceeds that of black fabric chair at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/83735fcb43d84ad2.jpg", "conversations": [ { "from": "human", "value": "\nIs black polished vintage car at center thinner than white satin dress at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, black polished vintage car at center is not thinner than white satin dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f10e72893479e745.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.222, 0.714) (B) (0.883, 0.377)" }, { "from": "gpt", "value": "(A) (0.222, 0.714)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/10d66c651df2bdd7.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden at center thinner than white cotton dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, wooden at center is not thinner than white cotton dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a3c94f9c5d893fd.jpg", "conversations": [ { "from": "human", "value": "\nDoes smooth skin face at center have a smaller size compared to nail polish at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, smooth skin face at center might be larger than nail polish at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/11ff53e0da78c978.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.639, 0.680) (B) (0.539, 0.072) (C) (0.366, 0.909) (D) (0.098, 0.497)" }, { "from": "gpt", "value": "(D) (0.098, 0.497)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c51ed24400577aff.jpg", "conversations": [ { "from": "human", "value": "\nIs satin pink coat at center further to camera compared to satin pink dress at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is in front of satin pink dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f63bbb0a90834219.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden-framed window at center closer to the viewer compared to clear glass window at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c1baa29299bfe44d.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) dark fabric umbrella at upper right (B) black matte umbrella at upper center" }, { "from": "gpt", "value": "(B) black matte umbrella at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d52df0e035e25136.jpg", "conversations": [ { "from": "human", "value": "\nIs white fabric shirt at lower left above pink fabric shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, white fabric shirt at lower left is positioned over pink fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf963481409a2f76.jpg", "conversations": [ { "from": "human", "value": "\nIs green jersey at center bigger than black plastic glasses at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, green jersey at center is bigger than black plastic glasses at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1761b0a8a0f19f63.jpg", "conversations": [ { "from": "human", "value": "\nDoes gold metallic ring at center appear over smooth skin at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, gold metallic ring at center is above smooth skin at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb09aab3f29a10d4.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of pink blossoms at center in relation to green leafy forest at left? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1429363900095dcf.jpg", "conversations": [ { "from": "human", "value": "\nIs green jersey at left thinner than white/blue striped jersey at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, green jersey at left is not thinner than white/blue striped jersey at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0f8fa69f3335a65.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.800, 0.463) (B) (0.858, 0.694) (C) (0.199, 0.380)" }, { "from": "gpt", "value": "(C) (0.199, 0.380)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/74aa4e552c1a0a2e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if orange fabric neckband at center is positioned above red fabric neckband at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, orange fabric neckband at center is not above red fabric neckband at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7fd6fb79d65b84c8.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue foam mat at center is positioned below dark gray casual pants at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, blue foam mat at center is positioned under dark gray casual pants at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a0c216ecd32fca2.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) gray silk shirt at right (B) blue shirt at center (C) white cotton shirt at center" }, { "from": "gpt", "value": "(B) blue shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e4f1105a1e2e275.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.204, 0.784) (B) (0.566, 0.180)" }, { "from": "gpt", "value": "(B) (0.566, 0.180)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/956f571a27e69ee0.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the blue fringed flag at left? Select from: (A) matte black uniform at center (B) blue-white-black flag at upper right" }, { "from": "gpt", "value": "(A) matte black uniform at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2535607926f917bc.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if plaid shirt at center is smaller than matte black backpack at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, plaid shirt at center might be larger than matte black backpack at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7c53871a336ce7ed.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.587, 0.327) (B) (0.521, 0.391)" }, { "from": "gpt", "value": "(A) (0.587, 0.327)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fa8359a9cc89c9eb.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) black suit at center (B) brown textured tie at center" }, { "from": "gpt", "value": "(A) black suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1753f9394feb781e.jpg", "conversations": [ { "from": "human", "value": "\nDoes wooden climbing net at center appear over red mesh netting at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, wooden climbing net at center is below red mesh netting at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c3cdbcd11494750.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) silky red flag at center (B) matte gray blazer at center (C) clear crystal chandelier at center" }, { "from": "gpt", "value": "(C) clear crystal chandelier at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4dc214ad0f636c10.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) black matte beard at left (B) black fuzzy beard at left (C) green striped sweater at upper center" }, { "from": "gpt", "value": "(C) green striped sweater at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88fdc0e8b10f25bf.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the green cotton shirt at center? Select from: (A) blue cotton shorts at center (B) pink cotton shirt at center" }, { "from": "gpt", "value": "(A) blue cotton shorts at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d7712e4c5fd472c.jpg", "conversations": [ { "from": "human", "value": "\nIs dark brown hair at lower center above teal satin dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/edfd4fdccd2d4100.jpg", "conversations": [ { "from": "human", "value": "\nIs brick pavement at center above printed jersey at right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, brick pavement at center is not positioned above printed jersey at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ffa9363bc0b1e819.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) white soft fabric baby at center (B) white glossy recreational vehicle at right (C) matte brown jacket at center" }, { "from": "gpt", "value": "(B) white glossy recreational vehicle at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/714296535bf087a0.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if asphalt road at center is smaller than striped fabric dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f6ab1c6e4640540f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.286, 0.202) (B) (0.722, 0.628)" }, { "from": "gpt", "value": "(B) (0.722, 0.628)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49ceb65890b109d8.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.275, 0.406) (B) (0.530, 0.831) (C) (0.237, 0.925)" }, { "from": "gpt", "value": "(B) (0.530, 0.831)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b979b008056aeb58.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if floral fabric armchair at center is positioned to the right of translucent plastic bottle at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, floral fabric armchair at center is to the right of translucent plastic bottle at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/069c586c5edde4c6.jpg", "conversations": [ { "from": "human", "value": "\nDoes dull tan dirt field at center appear over camouflage textured tank at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2bdcdd8e665b9e41.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the black leather jacket at center from the following options: (A) clear glass window at upper right (B) metallic fire escape at upper center?" }, { "from": "gpt", "value": "(A) clear glass window at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/098f870aeb596372.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.700, 0.377) (B) (0.569, 0.752)" }, { "from": "gpt", "value": "(A) (0.700, 0.377)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/426e3592112f88f7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue fabric table at center is smaller than gray textured blazer at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, blue fabric table at center is not smaller than gray textured blazer at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc79c88c816758b3.jpg", "conversations": [ { "from": "human", "value": "\nDoes snow-covered mountains at upper center have a smaller size compared to green leafy bush at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, snow-covered mountains at upper center is not smaller than green leafy bush at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e91c06cd6b79e4d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.179, 0.822) (B) (0.685, 0.386)" }, { "from": "gpt", "value": "(B) (0.685, 0.386)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06a18dee5f9616cc.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is white cotton blouse at center located relative to black plastic speaker at left? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5f31ad8b1373e88.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) plaid wool jacket at right (B) matte gray blazer at center (C) black silk tie at center" }, { "from": "gpt", "value": "(C) black silk tie at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de9b64a2763e08fa.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green grass at center is bigger than green fabric tent at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, green grass at center is larger in size than green fabric tent at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a12b9c31ec6f86cc.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.343, 0.525) (B) (0.973, 0.484) (C) (0.182, 0.259)" }, { "from": "gpt", "value": "(C) (0.182, 0.259)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd98c517c790e778.jpg", "conversations": [ { "from": "human", "value": "\nDoes green patina stone at center appear over green patina statue at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, green patina stone at center is below green patina statue at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c8edb15a95550a3c.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at upper center wider than light blue metallic truck at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, green leafy tree at upper center's width does not surpass light blue metallic truck at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7d2acba1f4ec0c6.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) white matte boat at lower center (B) smooth wood dock at center (C) white matte boat at center" }, { "from": "gpt", "value": "(C) white matte boat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ae54108212f3fbf.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.381, 0.287) (B) (0.784, 0.414)" }, { "from": "gpt", "value": "(A) (0.381, 0.287)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/839d03c96931de2c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.124, 0.903) (B) (0.148, 0.923) (C) (0.429, 0.945) (D) (0.106, 0.186)" }, { "from": "gpt", "value": "(C) (0.429, 0.945)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff3b403412e506e8.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) black textured blazer at center (B) matte black hair at center" }, { "from": "gpt", "value": "(A) black textured blazer at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2cc0571b5ef33155.jpg", "conversations": [ { "from": "human", "value": "\nIs glossy red car at center to the left of blue fabric jacket at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, glossy red car at center is to the right of blue fabric jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b7aca21218d76f3.jpg", "conversations": [ { "from": "human", "value": "\nDoes fuzzy black fur coat at center have a larger size compared to shiny red balloon at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, fuzzy black fur coat at center is larger in size than shiny red balloon at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/22b87ae7d52b8049.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white textured shirt at left is wider than sleek silver laptop at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, white textured shirt at left's width does not surpass sleek silver laptop at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/57f7721c23bf3259.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the yellow fabric flag at upper center? Choose from: (A) white plastic sign at right (B) white fabric flag at upper center (C) white plastic sign at center" }, { "from": "gpt", "value": "(C) white plastic sign at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e66f52e36187994.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.729, 0.905) (B) (0.639, 0.892)" }, { "from": "gpt", "value": "(B) (0.639, 0.892)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d6c4e7ebc4593ba.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) silver/glassy eyeglasses at center-right (B) matte black jacket at center (C) matte black jacket at right (D) black leather jacket at center" }, { "from": "gpt", "value": "(B) matte black jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e790abf50e6cd400.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) golden feathered rooster at center (B) black glossy feathers at right" }, { "from": "gpt", "value": "(B) black glossy feathers at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/adc97826bf3b5ad1.jpg", "conversations": [ { "from": "human", "value": "\nDoes denim jacket at lower right appear over sunglasses at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, denim jacket at lower right is not above sunglasses at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8488d6e0ecacceca.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is metallic steel bridge at upper center located relative to metallic silver accordion at lower left? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6fb33178ed887bfa.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the matte black motorcycle at center from the following options: (A) blue matte motorcycle at center (B) silver metallic helmet at center?" }, { "from": "gpt", "value": "(B) silver metallic helmet at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eedb193b6df2d1e4.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the green patina bronze statue at center? Choose from: (A) green patina stone at center (B) metallic gray statue at center" }, { "from": "gpt", "value": "(B) metallic gray statue at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8fce4c0cb9cd679.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if glossy ceramic countertop at upper center is positioned to the right of wooden drawer at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, glossy ceramic countertop at upper center is not on the right side of wooden drawer at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5dd418b68b2401fb.jpg", "conversations": [ { "from": "human", "value": "\nWhere is matte white projection screen at upper right located in relation to green matte shirt at lower right in the image? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fbe0c1a486e9b7a4.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.816, 0.234) (B) (0.579, 0.411) (C) (0.243, 0.339)" }, { "from": "gpt", "value": "(C) (0.243, 0.339)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8dc0cb3a28183996.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if red plaid shirt at left is thinner than green polished column at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, red plaid shirt at left might be wider than green polished column at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/30484439ed55f72e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the cowhide shield at center? Choose among these: (A) matte gold pharaoh at center (B) tan matte camel at right (C) white matte figure at center" }, { "from": "gpt", "value": "(B) tan matte camel at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/421a662b3c051e18.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the smooth suit at center? (A) matte white dress at center (B) floral dress at left (C) smooth white shirt at center" }, { "from": "gpt", "value": "(A) matte white dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/458d6f2c795229c2.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of matte striped shirt at center in reference to black leather swivel chair at left? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/306232233fbc407b.jpg", "conversations": [ { "from": "human", "value": "\nDoes sandstone clock tower at upper right appear under green leafy hedge at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, sandstone clock tower at upper right is above green leafy hedge at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5fcce71fb66e7068.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte green shirt at lower left have a smaller size compared to curly hair at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, matte green shirt at lower left is smaller than curly hair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a79d260bd87d2dda.jpg", "conversations": [ { "from": "human", "value": "\nWhere is shiny silver fish at center located in relation to shiny dark gray fish at center in the image? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82a21af51d87150b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if metallic gray train at center is thinner than dark purple shirt at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, metallic gray train at center might be wider than dark purple shirt at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f78ceee6dd581ff3.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) shiny black sedan at center (B) yellow matte taxi at lower center" }, { "from": "gpt", "value": "(B) yellow matte taxi at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e2cc511a90cf0835.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte orange poster at center is thinner than dark brown hair at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, matte orange poster at center might be wider than dark brown hair at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d5867870c1d5044.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green fabric curtain at center is smaller than red-white flag at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1111642ce2fe01af.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) brown crumbly bread at center (B) gray matte t-shirt at center" }, { "from": "gpt", "value": "(B) gray matte t-shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8ddfa4687ecf1c10.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny metallic motorcycle at left closer to camera compared to white matte shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, shiny metallic motorcycle at left is in front of white matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cced317d45f64e2f.jpg", "conversations": [ { "from": "human", "value": "\nIs floral shirt at center positioned before white hat at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/958045ccb3c4be6e.jpg", "conversations": [ { "from": "human", "value": "\nIs matte blue jacket at upper left to the right of soft fur puppy at upper left from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, matte blue jacket at upper left is positioned on the right side of soft fur puppy at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d3d13d7cf48c002c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.052, 0.848) (B) (0.108, 0.272)" }, { "from": "gpt", "value": "(B) (0.108, 0.272)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a25d354aab5dfa6.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the white satin suit at center? Choose from: (A) translucent glass bottle at right (B) white floral blouse at center (C) white satin blouse at center" }, { "from": "gpt", "value": "(A) translucent glass bottle at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fae16e0b782226c9.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.498, 0.466) (B) (0.828, 0.491) (C) (0.531, 0.522)" }, { "from": "gpt", "value": "(C) (0.531, 0.522)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23ec083f52fc229c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if plaid shirt at left is wider than matte red tank top at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, plaid shirt at left is not wider than matte red tank top at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4ad0c7cdab5d28c6.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the bronze statue at center from the following options: (A) red rubber double-decker bus at right (B) blue cotton shirt at lower right?" }, { "from": "gpt", "value": "(A) red rubber double-decker bus at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0278de4434c6ae8c.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the purple knit sweater at center? (A) purple knitted scarf at center (B) purple knitted scarf at left" }, { "from": "gpt", "value": "(B) purple knitted scarf at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8592049229f5b59.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the gold/yellow metal ring at lower center? Select from: (A) yellow rubber band at lower right (B) matte purple pants at center" }, { "from": "gpt", "value": "(B) matte purple pants at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34fb83e78270f937.jpg", "conversations": [ { "from": "human", "value": "\nIs green grassy river at lower left to the left of white glossy boat at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find green grassy river at lower left to the left of white glossy boat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dbc68bccdbabdc04.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if floral fabric curtain at upper left is positioned to the right of mahogany wood coffee table at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, floral fabric curtain at upper left is to the left of mahogany wood coffee table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88a0cf49c458a141.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at center below green leafy tree at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green leafy tree at center is positioned under green leafy tree at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d8e7491e4f3bda6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green matte tree at center is bigger than green leafy trees at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, green matte tree at center is not bigger than green leafy trees at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d737740abe3187f7.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of dark gray suit at right in reference to dark gray suit at center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f63722149fea348f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.769, 0.298) (B) (0.894, 0.827) (C) (0.135, 0.831)" }, { "from": "gpt", "value": "(C) (0.135, 0.831)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7924c025c36b6497.jpg", "conversations": [ { "from": "human", "value": "\nIs brown knitted hat at right wider than matte yellow jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, brown knitted hat at right is wider than matte yellow jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/009d7b2fb1c67a98.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the white satin dress at center? Choose among these: (A) white textured cake at right (B) white satin dress at right" }, { "from": "gpt", "value": "(A) white textured cake at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2baea5a74af3a88f.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.508, 0.344) (B) (0.489, 0.419) (C) (0.793, 0.356)" }, { "from": "gpt", "value": "(B) (0.489, 0.419)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a34801a0cc78d81f.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.964, 0.961) (B) (0.865, 0.200) (C) (0.011, 0.244) (D) (0.202, 0.548)" }, { "from": "gpt", "value": "(A) (0.964, 0.961)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0d0d33fa7499063.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.568, 0.620) (B) (0.219, 0.341)" }, { "from": "gpt", "value": "(A) (0.568, 0.620)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d22e5ab198b73ef2.jpg", "conversations": [ { "from": "human", "value": "\nIs glossy red van at center positioned at the back of shiny red van at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, glossy red van at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e1f7ef41e1fef86.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the white wooden ladder at left? (A) yellow matte shirt at center (B) matte red heart at center" }, { "from": "gpt", "value": "(B) matte red heart at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8da75bae38bf4cf5.jpg", "conversations": [ { "from": "human", "value": "\nIs matte plastic scoreboard at center to the left of american flag at upper left from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, matte plastic scoreboard at center is not to the left of american flag at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f9bab8b51696085.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the light blue tie-dye shirt at center? Choose from: (A) white creamy food at lower left (B) white matte plate at lower left" }, { "from": "gpt", "value": "(B) white matte plate at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf218ad6c0fcdf8a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.626, 0.722) (B) (0.894, 0.522) (C) (0.391, 0.692) (D) (0.240, 0.662)" }, { "from": "gpt", "value": "(A) (0.626, 0.722)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a72e1416db2f08a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.784, 0.919) (B) (0.626, 0.558)" }, { "from": "gpt", "value": "(A) (0.784, 0.919)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/53ccbc12b31a66cb.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) lace dress at center (B) purple lace dress at center" }, { "from": "gpt", "value": "(A) lace dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fd8718cadcfda22a.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark blue sweater at center come in front of weathered wood picnic table at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/680358049647255a.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of rusty metal train bridge at left in reference to green matte truck at lower right? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3e7df2a6c2eea415.jpg", "conversations": [ { "from": "human", "value": "\nIs gold metallic cross at upper center wider than dark brown leather shoes at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, gold metallic cross at upper center might be narrower than dark brown leather shoes at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be64883e637fa428.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the pink shiny dress at center? Choose from: (A) red polka dot fabric ballet skirt at center (B) matte black dress at upper left (C) white fluffy dress at center" }, { "from": "gpt", "value": "(B) matte black dress at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d3e0a28458b1c8f.jpg", "conversations": [ { "from": "human", "value": "\nIs matte plastic projection screen at upper left below denim shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, matte plastic projection screen at upper left is not below denim shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca50e3b30f04292b.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the green leafy bush at right? Choose from: (A) light brown gravel at center (B) green leafy plant at left" }, { "from": "gpt", "value": "(A) light brown gravel at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f8cedc97e5afbd8.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of white feathered bird at upper left less distant than that of pink feathered flamingo at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, white feathered bird at upper left is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b007f4574ed1950.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) green leafy tree at lower left (B) green leafy palm at center (C) white stucco tower at center" }, { "from": "gpt", "value": "(C) white stucco tower at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08a789df854e74d4.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of green matte tree at center and bronze statue at center in the image provided, where is green matte tree at center located with respect to bronze statue at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/99d4b570a16b0f92.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green metallic car at lower center is positioned to the left of green fabric picnic table at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, green metallic car at lower center is to the right of green fabric picnic table at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/45b8f7ae2a927c63.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green rough bark tree at upper center is smaller than camouflage jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, green rough bark tree at upper center might be larger than camouflage jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/819f7b96023082d8.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy plant at right have a greater width compared to rustic wood window box at right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db9a41f301ca3b32.jpg", "conversations": [ { "from": "human", "value": "\nIs brick pavement at lower left closer to camera compared to shiny metallic cans at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, brick pavement at lower left is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b951312383a5240a.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark brown water at center appear over green matte leaves at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/974d0f64f400040e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at upper center is positioned to the right of white marble clock at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, green leafy tree at upper center is positioned on the right side of white marble clock at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4a71af77bf9a4f2.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) black metallic microphone at center (B) black matte cardigan at center" }, { "from": "gpt", "value": "(A) black metallic microphone at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb40f83d9e1a5fc3.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.823, 0.431) (B) (0.984, 0.836) (C) (0.112, 0.509) (D) (0.459, 0.772)" }, { "from": "gpt", "value": "(A) (0.823, 0.431)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d133e8b37803ace4.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black jacket at center wider than dark gray sweater at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte black jacket at center is wider than dark gray sweater at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0185699b606df2bb.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow straw bales at center below white matte barn at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/189122023b9d2018.jpg", "conversations": [ { "from": "human", "value": "\nIs blue plastic toy truck at center bigger than matte plastic truck at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, blue plastic toy truck at center has a larger size compared to matte plastic truck at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec037cdccbced51c.jpg", "conversations": [ { "from": "human", "value": "\nDoes white glossy computer screen at upper center appear on the right side of silver metallic laptop at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, white glossy computer screen at upper center is to the right of silver metallic laptop at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5afe226df550344e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown wooden dock at center is positioned above white wooden boat at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/859310d5e2caa95f.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte duck at center further to camera compared to white matte duck at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1787108cf3905df0.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.894, 0.761) (B) (0.139, 0.439)" }, { "from": "gpt", "value": "(B) (0.139, 0.439)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b39feacdf05df93.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the green checkered tablecloth at center? (A) matte peach blouse at center (B) brown fabric baby at center (C) blue plaid shirt at left" }, { "from": "gpt", "value": "(C) blue plaid shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/62145703a0b46828.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white matte jacket at center is positioned to the right of black hoodie at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white matte jacket at center is not to the right of black hoodie at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/edc8a134c6c50825.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) matte black shirt at left (B) smooth black dress at center" }, { "from": "gpt", "value": "(B) smooth black dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/12ccd13e66586355.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte purple jersey at center is positioned above purple matte jersey at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, matte purple jersey at center is above purple matte jersey at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6c3a87442ce9ecc.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) green leafy tree at right (B) gray asphalt road at lower left (C) green grassy hillside at center (D) green grassy at center" }, { "from": "gpt", "value": "(C) green grassy hillside at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/af8bb93f8d3b0bba.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the plaid kilt at center from the following options: (A) red-white striped fabric flag at left (B) brown leather jacket at center (C) blue striped canopy at upper center (D) matte black kilt at center?" }, { "from": "gpt", "value": "(A) red-white striped fabric flag at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/30cce89b34b1244c.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of green mossy plant at right in relation to brown rough tree trunk at center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/13909d11dbe65be8.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray metallic pole at left is bigger than white paper at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, gray metallic pole at left is bigger than white paper at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ab7934cb1197634.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) matte red jacket at lower right (B) pink satin hijab at upper left (C) matte red jacket at center (D) brown cotton shirt at center" }, { "from": "gpt", "value": "(B) pink satin hijab at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f63cbb1b8b230213.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.116, 0.386) (B) (0.438, 0.409)" }, { "from": "gpt", "value": "(B) (0.438, 0.409)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b03834c8011a473f.jpg", "conversations": [ { "from": "human", "value": "\nIs silver metallic computer monitor at upper center bigger than silver metallic keyboard at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, silver metallic computer monitor at upper center is bigger than silver metallic keyboard at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc3414aff5b6c2c2.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if striped fabric shirt at center is thinner than purple checkered shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d86d58d01205105.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) black glossy horse at right (B) high-visibility reflective jacket at center (C) dark blue leather jacket at left" }, { "from": "gpt", "value": "(B) high-visibility reflective jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4269ca909245883d.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of metallic silver car at lower right and white matte car at lower left in the image provided, where is metallic silver car at lower right located with respect to white matte car at lower left? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4af6dd42f2567139.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of white ceramic cup at lower center and white ceramic mug at lower center in the image provided, where is white ceramic cup at lower center located with respect to white ceramic mug at lower center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f11b927ce43d20c1.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of brown matte branch at center in relation to green leafy tree at upper right? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f93e4ed35d21cfc8.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.578, 0.559) (B) (0.792, 0.750) (C) (0.212, 0.417)" }, { "from": "gpt", "value": "(A) (0.578, 0.559)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0c88527fd9434a0b.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass at center to the right of gray rock at upper center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green grass at center is positioned on the right side of gray rock at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4932f1366463a032.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the shiny black locomotive at center? (A) white smoke at center (B) matte black train at center" }, { "from": "gpt", "value": "(A) white smoke at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b863d6682dd1eb5e.jpg", "conversations": [ { "from": "human", "value": "\nDoes rusty metal bridge at center have a greater width compared to green leafy tree at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, rusty metal bridge at center has a greater width compared to green leafy tree at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/425a9f317778b051.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.139, 0.686) (B) (0.795, 0.706) (C) (0.745, 0.470)" }, { "from": "gpt", "value": "(C) (0.745, 0.470)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4abd5739e17833e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.191, 0.670) (B) (0.352, 0.536) (C) (0.805, 0.909)" }, { "from": "gpt", "value": "(A) (0.191, 0.670)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ebd7c977a69dcc28.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the white striped shirt at center? (A) white leather suspenders at center (B) white cotton shirt at center" }, { "from": "gpt", "value": "(A) white leather suspenders at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3181fcdde6272944.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is black matte shirt at center located relative to translucent glass beer at right? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2db4d2e78bcd27b7.jpg", "conversations": [ { "from": "human", "value": "\nIs brown cardboard box at center positioned before white plastic bag at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a4a8e33b64bab9b.jpg", "conversations": [ { "from": "human", "value": "\nIs silhouette backpack at left further to camera compared to white paper text at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, silhouette backpack at left is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/24f755c87ad8516f.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of green textured tree at center and dark blue jeans at center in the image provided, where is green textured tree at center located with respect to dark blue jeans at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5062ac73bc6f2413.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.424, 0.839) (B) (0.171, 0.670) (C) (0.065, 0.647)" }, { "from": "gpt", "value": "(A) (0.424, 0.839)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/198e0dcd037a0a8d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if yellow matte arrow at lower left is bigger than metallic pole at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, yellow matte arrow at lower left is not bigger than metallic pole at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cea5c23ac62683e7.jpg", "conversations": [ { "from": "human", "value": "\nDoes checkered fabric shirt at left appear on the left side of clear plastic bottle at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, checkered fabric shirt at left is positioned on the left side of clear plastic bottle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/faf12ba81031a096.jpg", "conversations": [ { "from": "human", "value": "\nDoes camouflage uniform at center come in front of camouflage fabric uniform at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f3cdab3840bc680.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of matte black helmet at upper right in reference to black matte walkie-talkie at left? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc144958ab2a65ee.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark gray textured tree at center is positioned below green grassy field at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, dark gray textured tree at center is not below green grassy field at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/21df4a883cca423b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark purple fabric stool at lower right is positioned to the right of golden crispy chicken at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, dark purple fabric stool at lower right is to the right of golden crispy chicken at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/96e0a444df8115c3.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) black matte bowl at lower right (B) matte black boot at center (C) matte black boot at right" }, { "from": "gpt", "value": "(C) matte black boot at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/778c82d716628431.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.224, 0.258) (B) (0.876, 0.709) (C) (0.630, 0.762)" }, { "from": "gpt", "value": "(B) (0.876, 0.709)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82ec278042229bd9.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of yellow matte shirt at center and multicolored plastic blocks at upper center in the image provided, where is yellow matte shirt at center located with respect to multicolored plastic blocks at upper center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ffe0f99924fd7751.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is silver metallic bicycle at lower left located relative to shiny metallic bicycle at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c8bc7cf54f64fe8.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the velvet blue and red cape at center? (A) metallic flute at center (B) velvet red coat at left (C) black wood clarinet at center" }, { "from": "gpt", "value": "(B) velvet red coat at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b110c321293965f.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) light brown leather jacket at center (B) gray fabric shirt at lower right (C) black cotton shirt at left" }, { "from": "gpt", "value": "(B) gray fabric shirt at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0797a841eca083c8.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass at lower left positioned behind red fabric flag at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, green grass at lower left is in front of red fabric flag at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/15d8f42ea5e7dfcf.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue cotton shirt at center come behind gray fur seal at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44dd7bea0c891a56.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte penguin at lower left below gray rough stone at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, black matte penguin at lower left is not below gray rough stone at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60de01fefd2b8533.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is brown leather belt at lower center located relative to leather/cracked at center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1779101859a8be9a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at upper center is wider than green mossy water at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/639635212c01d011.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the polished silver spire at upper center? (A) green leafy tree at left (B) stone gothic cathedral at center (C) green painted metal streetlight at lower center" }, { "from": "gpt", "value": "(B) stone gothic cathedral at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de7cb24b88bb249d.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy grass at lower left positioned at the back of brick wall at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/48bc15916ec46755.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) plaid shirt at center (B) matte black jacket at center (C) black satin dress at center, is positioned farthest from the black leather jacket at center?" }, { "from": "gpt", "value": "(B) matte black jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/55060959036db692.jpg", "conversations": [ { "from": "human", "value": "\nWhere is white matte tank top at center located in relation to hairy skin tattoo at center in the image? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b8baf3857082351d.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.191, 0.470) (B) (0.120, 0.505) (C) (0.088, 0.781) (D) (0.994, 0.244)" }, { "from": "gpt", "value": "(D) (0.994, 0.244)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f8915a0a499ee62.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the gray concrete wall at left? Choose among these: (A) concrete/rough pillar at right (B) rusty metal pillar at center" }, { "from": "gpt", "value": "(B) rusty metal pillar at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d528143736007c24.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy palm at center below white marble palace at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/55a4769980444ade.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) green leafy forest at center (B) yellow-green leafy tree at lower right" }, { "from": "gpt", "value": "(B) yellow-green leafy tree at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/122647cf9a8e3a6d.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) blonde hair vest at lower left (B) green fabric flower girl at lower right (C) satin/sheer white dress at center" }, { "from": "gpt", "value": "(C) satin/sheer white dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2de661bfdc12a1f9.jpg", "conversations": [ { "from": "human", "value": "\nDoes green grass at center have a lesser width compared to blue matte shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, green grass at center is not thinner than blue matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a9ecf561b95cd365.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte plastic tub at center is wider than shiny gold foil at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5853512ff4194bc5.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green matte broccoli at center is positioned to the right of shiny red sauce at top right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, green matte broccoli at center is not to the right of shiny red sauce at top right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fad63140bacb6dad.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.368, 0.194) (B) (0.352, 0.475) (C) (0.197, 0.548) (D) (0.124, 0.605)" }, { "from": "gpt", "value": "(D) (0.124, 0.605)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c3b5f860685066f8.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black suit at center appear over white matte mug at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ec4f2496a3c8b7c.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow wood boat at lower left wider than green wooden boat at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, yellow wood boat at lower left has a greater width compared to green wooden boat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b658c96945174b58.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) light beige fabric bag at lower right (B) green grass at lower center (C) matte white blouse at lower center (D) khaki uniform at center" }, { "from": "gpt", "value": "(D) khaki uniform at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e97fbfe240047b75.jpg", "conversations": [ { "from": "human", "value": "\nIs rusty metal water at upper center bigger than yellow metallic excavator at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, rusty metal water at upper center is larger in size than yellow metallic excavator at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8becd0b2f4c07b9c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) satin dress at center (B) black lace dress at center (C) white feather boa at right" }, { "from": "gpt", "value": "(B) black lace dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/146b8fc9475c9eb0.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.661, 0.759) (B) (0.307, 0.081)" }, { "from": "gpt", "value": "(A) (0.661, 0.759)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/150713529aa05ba8.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is shiny blue uniform at right located relative to shiny dark blue uniform at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c0b1bc9ff03de8af.jpg", "conversations": [ { "from": "human", "value": "\nDoes gold brocade robe at center appear under gold lacquered statue at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b82b4b22ea94193d.jpg", "conversations": [ { "from": "human", "value": "\nIs slate gray concrete at center thinner than matte gray dress at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, slate gray concrete at center's width is not less than matte gray dress at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c722deb4a1a8b4be.jpg", "conversations": [ { "from": "human", "value": "\nDoes silver chain at left come behind silver metallic chain at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df23410d59712f4c.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.032, 0.680) (B) (0.894, 0.423)" }, { "from": "gpt", "value": "(B) (0.894, 0.423)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/641678688a360235.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the matte skin hand at center? Select from: (A) striped jersey at center (B) matte striped shirt at center" }, { "from": "gpt", "value": "(A) striped jersey at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c9500df4e64b2377.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if yellow matte shirt at center is wider than denim jeans at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, yellow matte shirt at center has a greater width compared to denim jeans at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b6c9a2491a2f52a.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the white marble column at center? (A) stone/concrete mausoleum at center (B) white stone column at center (C) matte glass door at center (D) smooth gray stone church at left" }, { "from": "gpt", "value": "(C) matte glass door at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/077019a15b0dfdcf.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.331, 0.556) (B) (0.200, 0.186)" }, { "from": "gpt", "value": "(A) (0.331, 0.556)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e15abebf8ebb8b9e.jpg", "conversations": [ { "from": "human", "value": "\nDoes green grass at center lie in front of orange matte vest at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, green grass at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8df37ccb3cbce20a.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden chair at center thinner than metallic brown chair at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, wooden chair at center has a lesser width compared to metallic brown chair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c3cefdb5cf935c10.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) smooth black telegraph pole at center (B) brown leafy tree at lower right" }, { "from": "gpt", "value": "(A) smooth black telegraph pole at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f2454606ada880e.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) green leafy tree at upper center (B) bare wood tree at upper right (C) green grassy field at center" }, { "from": "gpt", "value": "(B) bare wood tree at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/752472659f2b334b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black velvet dress at center is bigger than white floral bouquet at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4af5324e9a0fcc40.jpg", "conversations": [ { "from": "human", "value": "\nIs white water at center to the left of matte black jacket at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white water at center is not to the left of matte black jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/185040328258f153.jpg", "conversations": [ { "from": "human", "value": "\nIs sandstone statue at center above matte stone nose at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, sandstone statue at center is not positioned above matte stone nose at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/773d3ece775716a8.jpg", "conversations": [ { "from": "human", "value": "\nIs brown wooden shutter at left bigger than light blue shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29ffe2152326da14.jpg", "conversations": [ { "from": "human", "value": "\nIs matte blue shirt at center closer to the viewer compared to light blue cotton shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte blue shirt at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4e3bcaa311ae6271.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.800, 0.328) (B) (0.312, 0.741) (C) (0.656, 0.541)" }, { "from": "gpt", "value": "(B) (0.312, 0.741)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/30c409cd4b9d6307.jpg", "conversations": [ { "from": "human", "value": "\nDoes white lined paper at center appear under green ceramic mug at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white lined paper at center is not below green ceramic mug at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f078b917012e2124.jpg", "conversations": [ { "from": "human", "value": "\nIs black and tan fur puppy at center behind black and white fur at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/43ba12d94a8872f9.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) green wood pole at right (B) white metallic flag pole at left (C) red-white-striped flag at upper left" }, { "from": "gpt", "value": "(A) green wood pole at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9fc0e97a30533572.jpg", "conversations": [ { "from": "human", "value": "\nIs clear glass door at center in front of black rubber mat at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/09ec32608cf39bf9.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.982, 0.241) (B) (0.249, 0.569)" }, { "from": "gpt", "value": "(B) (0.249, 0.569)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d6a6c834e7de216.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the blue striped shirt at center? Select from: (A) orange checkered shirt at center (B) white satin blouse at center (C) satin blue suit at left" }, { "from": "gpt", "value": "(A) orange checkered shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aa59647a3f656210.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is white striped pants at center located relative to brown wooden stool at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/556dde93054dde15.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) dark gray fabric shirt at center (B) brown textured shorts at center (C) green concrete river at center (D) smooth skin man at lower center" }, { "from": "gpt", "value": "(D) smooth skin man at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4c7e110f089636e5.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark blue shirt at center have a lesser width compared to khaki fabric uniform at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, dark blue shirt at center is thinner than khaki fabric uniform at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/289cb2bfd6ebbc3e.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the matte red shorts at center among (A) dark blue fabric pants at center (B) white mesh shirt at center (C) matte blue jersey at center?" }, { "from": "gpt", "value": "(B) white mesh shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a250334a4378fbde.jpg", "conversations": [ { "from": "human", "value": "\nWhere is dark gray fabric bag at lower left located in relation to white uniform shirt at center in the image? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2caefb60d5fd1974.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black vest at center is wider than shiny red fabric dress at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte black vest at center is wider than shiny red fabric dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37505aee043f5460.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) black matte shirt at lower right (B) black matte dress at lower center (C) black leather jacket at center (D) concrete sidewalk at lower center" }, { "from": "gpt", "value": "(D) concrete sidewalk at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/41953ea2818ef654.jpg", "conversations": [ { "from": "human", "value": "\nIs transparent plastic bottle at lower left in front of black metallic microphone at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, transparent plastic bottle at lower left is in front of black metallic microphone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0747e2acb05c22f.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) cloudy sky at center (B) shiny metallic tower at center" }, { "from": "gpt", "value": "(B) shiny metallic tower at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/094187003ad2e09e.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the dark gray textured suit at center among (A) brown wool suit at right (B) gray wool suit at left (C) gray pinstripe suit at left?" }, { "from": "gpt", "value": "(A) brown wool suit at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f2a194151f267755.jpg", "conversations": [ { "from": "human", "value": "\nIs green plaid scarf at center thinner than green plaid fabric at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green plaid scarf at center has a lesser width compared to green plaid fabric at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d096892c75d1df0.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden stringed instrument at lower left bigger than silver metallic laptop at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, wooden stringed instrument at lower left is larger in size than silver metallic laptop at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04c2f5c20e60cb4f.jpg", "conversations": [ { "from": "human", "value": "\nDoes black matte shirt at center have a greater width compared to wooden at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/445f7937ce2fe6be.jpg", "conversations": [ { "from": "human", "value": "\nIs tan wool blazer at center to the right of matte black suit at upper left from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, tan wool blazer at center is positioned on the right side of matte black suit at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f73fa6a3ba990ad.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.855, 0.770) (B) (0.703, 0.967)" }, { "from": "gpt", "value": "(B) (0.703, 0.967)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23db66a6b131a1d7.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.254, 0.155) (B) (0.108, 0.802) (C) (0.741, 0.261)" }, { "from": "gpt", "value": "(B) (0.108, 0.802)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4977ee44701d2b6f.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) flannel shirt at right (B) metallic mesh trampoline at center" }, { "from": "gpt", "value": "(A) flannel shirt at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aa93b20a550bbcda.jpg", "conversations": [ { "from": "human", "value": "\nIs earthy brown rock at center to the left of denim jacket at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, earthy brown rock at center is to the left of denim jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b9e03541264cb9c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) matte skin at center (B) matte black nose at center (C) matte white sunglasses at center (D) glossy black helmet at center" }, { "from": "gpt", "value": "(A) matte skin at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6c0b932110175e8.jpg", "conversations": [ { "from": "human", "value": "\nIs blue fabric headscarf at upper right positioned before light brown skin child at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/619730922737097c.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the brown suede shoe at lower left from the following options: (A) suede/leather shoe at lower center (B) green grass at lower center?" }, { "from": "gpt", "value": "(B) green grass at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2fcc84847528e8d8.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.545, 0.470) (B) (0.031, 0.241) (C) (0.415, 0.541)" }, { "from": "gpt", "value": "(C) (0.415, 0.541)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/75fa969a51f4923f.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) wooden at center (B) striped shirt at center (C) dark blue jeans at center" }, { "from": "gpt", "value": "(B) striped shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5530578ff2d132c.jpg", "conversations": [ { "from": "human", "value": "\nIs rusty metal gear at center closer to camera compared to rusty white gear at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, rusty metal gear at center is further to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc63fbd1cf93603c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.281, 0.655) (B) (0.108, 0.348) (C) (0.140, 0.812) (D) (0.016, 0.739)" }, { "from": "gpt", "value": "(D) (0.016, 0.739)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e37253bf5a77603a.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of green matte train car at center in relation to matte black locomotive at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36caa2a214cda143.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of green leafy palm tree at left in reference to silver metallic truck at lower left? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46c266d6a37620ae.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) beige stone tower at upper left (B) white fabric banner at center" }, { "from": "gpt", "value": "(B) white fabric banner at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c9b778d0be5525f.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) stained glass lampshade at upper center (B) clear glass window at center, is positioned closest to the white plastic chair at center?" }, { "from": "gpt", "value": "(B) clear glass window at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/409b07397e920747.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.728, 0.383) (B) (0.363, 0.994) (C) (0.640, 0.909)" }, { "from": "gpt", "value": "(A) (0.728, 0.383)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce22214494b0653b.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of black chalkboard at upper left and matte plastic pastry at center in the image provided, where is black chalkboard at upper left located with respect to matte plastic pastry at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/215f6d864228c073.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the weathered wood ladder at center? (A) smooth concrete hut at center (B) matte red shirt at upper center" }, { "from": "gpt", "value": "(B) matte red shirt at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b90bc856c2b395b.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the blue plaid shirt at center? Choose from: (A) wooden table at center (B) white cream cake at lower left" }, { "from": "gpt", "value": "(A) wooden table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bb45c9a957038ac4.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the gray matte blazer at center from the following options: (A) black metallic microphone at center (B) light blue shirt at left (C) red plastic table at center?" }, { "from": "gpt", "value": "(B) light blue shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8712e83c92400367.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy branches at upper center is bigger than glistening blue water at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green leafy branches at upper center has a larger size compared to glistening blue water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4e22b87e6152ca0.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.641, 0.491) (B) (0.205, 0.545)" }, { "from": "gpt", "value": "(A) (0.641, 0.491)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c16ff815b2f81b21.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of green matte shirt at center in reference to brown fur dog at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a3cd17b9a65b75ec.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green matte tree at center is positioned above rocky snow-covered peak at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, green matte tree at center is not positioned above rocky snow-covered peak at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/efe253bdd72d9b55.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) brown dirt track at center-right (B) metallic silver tower at upper left (C) brown leather pants at lower right" }, { "from": "gpt", "value": "(C) brown leather pants at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed36d617a72e5ff9.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the shiny black motorcycle at center? Choose among these: (A) concrete at lower center (B) metallic silver motorcycle at center (C) shiny metallic motorcycle at center" }, { "from": "gpt", "value": "(B) metallic silver motorcycle at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a9c9859ed9963e5.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.647, 0.758) (B) (0.306, 0.619)" }, { "from": "gpt", "value": "(B) (0.306, 0.619)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/137233d6d5a869c3.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the yellow matte crayon at center among (A) yellow plastic crayon at lower center (B) wooden table at center?" }, { "from": "gpt", "value": "(B) wooden table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/45e08728c9437916.jpg", "conversations": [ { "from": "human", "value": "\nIs blue painted asphalt at lower center thinner than dark brown cotton shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, blue painted asphalt at lower center might be wider than dark brown cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f3d6b57618a04dcd.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.839, 0.973) (B) (0.285, 0.831) (C) (0.045, 0.677)" }, { "from": "gpt", "value": "(B) (0.285, 0.831)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d02b150c852203e.jpg", "conversations": [ { "from": "human", "value": "\nDoes green grassy field at center have a greater width compared to green leafy tree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92c9f6e87287b6cf.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) teal fleece jacket at center (B) green fleece jacket at left (C) black fleece jacket at center" }, { "from": "gpt", "value": "(C) black fleece jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd3ae5ea28fd3257.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black screen at right lie in front of metallic silver frame at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, matte black screen at right is behind metallic silver frame at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e76528d597378bf7.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the dark gray suit at left? (A) wooden table at center (B) black matte jacket at upper center" }, { "from": "gpt", "value": "(B) black matte jacket at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7d79b5e70b477489.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green grassy wheat field at center is wider than white fluffy cloud at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, green grassy wheat field at center is not wider than white fluffy cloud at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a15105ac3af3f0cb.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.404, 0.594) (B) (0.778, 0.795)" }, { "from": "gpt", "value": "(B) (0.778, 0.795)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c34c4a692d4ea17.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) green leafy trees at upper left (B) clear wire at upper center (C) green leafy tree at lower right" }, { "from": "gpt", "value": "(C) green leafy tree at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aea34096c7e74eb7.jpg", "conversations": [ { "from": "human", "value": "\nDoes white textured dress at center appear under white cotton dress at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, white textured dress at center is located below white cotton dress at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd73269163bf17e5.jpg", "conversations": [ { "from": "human", "value": "\nIs black rock at center to the left of blue water at upper center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, black rock at center is positioned on the left side of blue water at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/41d8f4bf9e50d88e.jpg", "conversations": [ { "from": "human", "value": "\nIs camouflage fabric uniform at upper center positioned at the back of tan matte rifle at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, camouflage fabric uniform at upper center is behind tan matte rifle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86b59aaecffb4c95.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.456, 0.698) (B) (0.815, 0.216)" }, { "from": "gpt", "value": "(A) (0.456, 0.698)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1c09534e084cf40.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown and white fur at lower center appear on the left side of wooden table at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, brown and white fur at lower center is positioned on the left side of wooden table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3fc7611b79991c81.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray suit at center is wider than matte black suit at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/79012568adc2a39a.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue denim jeans at center have a smaller size compared to dark blue jeans at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, blue denim jeans at center is not smaller than dark blue jeans at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd0ba4f7a8e258d9.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.648, 0.787) (B) (0.016, 0.542)" }, { "from": "gpt", "value": "(B) (0.016, 0.542)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb181a129c45e297.jpg", "conversations": [ { "from": "human", "value": "\nDoes zebra-patterned dress at center appear on the right side of matte black necklace at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find zebra-patterned dress at center to the right of matte black necklace at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4b4e2baae7c1b3e9.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.585, 0.627) (B) (0.444, 0.464)" }, { "from": "gpt", "value": "(A) (0.585, 0.627)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/57d801581566ffba.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) blonde hair at center (B) matte white shirt at left (C) white striped shirt at upper right (D) clear glass at right" }, { "from": "gpt", "value": "(C) white striped shirt at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea4e8a5e19c8ef7b.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the red stone railing at center from the following options: (A) pink stone building at center (B) mosaic tile dome at upper center?" }, { "from": "gpt", "value": "(A) pink stone building at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1918ce8b6f00887c.jpg", "conversations": [ { "from": "human", "value": "\nIs concrete ledge at center to the left of denim jacket at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, concrete ledge at center is to the left of denim jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d31e4f3bd10831a4.jpg", "conversations": [ { "from": "human", "value": "\nIs argyle sweater at center bigger than floral print blouse at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, argyle sweater at center is larger in size than floral print blouse at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/51ea11ba365c6e7b.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown wooden table at center have a lesser width compared to yellow matte shirt at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, brown wooden table at center is not thinner than yellow matte shirt at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d8f7b5fcf66bdbc.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte building at center have a smaller size compared to blue metallic boat at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d8a93359c52c34db.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.186, 0.533) (B) (0.583, 0.523) (C) (0.662, 0.558) (D) (0.782, 0.917)" }, { "from": "gpt", "value": "(B) (0.583, 0.523)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0147e12e50998cc1.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark wool suit at left is wider than silver metallic suit at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of dark wool suit at left exceeds that of silver metallic suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f642cffbedc7980d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.128, 0.211) (B) (0.601, 0.723)" }, { "from": "gpt", "value": "(A) (0.128, 0.211)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eaa6fc4015821a8d.jpg", "conversations": [ { "from": "human", "value": "\nDoes wooden frame at upper left appear under yellow matte food at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, wooden frame at upper left is above yellow matte food at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e464bc5794ce049.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the camouflage fabric uniform at center from the following options: (A) camouflage uniform at center (B) yellowmattesign at center (C) camouflage fabric uniform at right (D) camouflage fabric uniform at left?" }, { "from": "gpt", "value": "(D) camouflage fabric uniform at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c5e49e44d84777d1.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) matte nylon jacket at center (B) white matte door at center" }, { "from": "gpt", "value": "(B) white matte door at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/baa55b985737754e.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.690, 0.933) (B) (0.740, 0.809)" }, { "from": "gpt", "value": "(B) (0.740, 0.809)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6587e5b7b1bc644e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green soft sweater at center is bigger than green velvety sweatshirt at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, green soft sweater at center is bigger than green velvety sweatshirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/020187f9b80253a0.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) brown dry hay at center (B) blue plaid shirt at center (C) matte gray vest at left" }, { "from": "gpt", "value": "(A) brown dry hay at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/980277b13b39fa32.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte jacket at center wider than orange cleats at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, black matte jacket at center's width does not surpass orange cleats at right's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e59ac6ba4621a581.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of matte blue jersey at center in relation to black and white striped shirt at left? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f066fb71f8f8ee28.jpg", "conversations": [ { "from": "human", "value": "\nIs matte red coat at center bigger than matte black jacket at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, matte red coat at center is larger in size than matte black jacket at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a40cd108a404135c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) green mossy river at center (B) rustic wooden bridge at center" }, { "from": "gpt", "value": "(B) rustic wooden bridge at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2bc63d53445b51e0.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte white screen at center is smaller than white fabric flag at right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, matte white screen at center is not smaller than white fabric flag at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a880068a856f48f2.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if smooth blue shirt at center is positioned above hardcover book at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, smooth blue shirt at center is positioned over hardcover book at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d2aa071f3d701590.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.603, 0.219) (B) (0.461, 0.359)" }, { "from": "gpt", "value": "(A) (0.603, 0.219)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7820d140f82150ff.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) metal at center (B) blue shirt at right (C) matte black shirt at center" }, { "from": "gpt", "value": "(A) metal at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5ad88181dacce324.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of quilted black jacket at center in relation to dark gray quilted jacket at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01b23ed77f4ffacf.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) blue metallic ski suit at left (B) black matte ski at center" }, { "from": "gpt", "value": "(A) blue metallic ski suit at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/83b3da30d60ce34f.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) white glossy mug at center (B) translucent ceramic cup at center (C) matte white saucer at lower center (D) white glossy teapot at center" }, { "from": "gpt", "value": "(B) translucent ceramic cup at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5e00b869dee2b5a.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.155, 0.719) (B) (0.508, 0.528) (C) (0.526, 0.963)" }, { "from": "gpt", "value": "(A) (0.155, 0.719)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/24bed5e9fc62d4b2.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.227, 0.816) (B) (0.191, 0.489) (C) (0.338, 0.439) (D) (0.108, 0.545)" }, { "from": "gpt", "value": "(A) (0.227, 0.816)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/67001ab7ccd10263.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) orange matte pumpkin at lower left (B) black and white spotted cows at center (C) orange matte pumpkin at lower center" }, { "from": "gpt", "value": "(B) black and white spotted cows at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd7de35fdd03056e.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) wooden gazebo at center (B) golden fur lion at center" }, { "from": "gpt", "value": "(B) golden fur lion at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c88805b76a5c2f73.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green fabric dress at center is positioned below white matte cake at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, green fabric dress at center is not below white matte cake at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00745e321470b42c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) blue matte helmet at center (B) shiny pink bicycle at center" }, { "from": "gpt", "value": "(A) blue matte helmet at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/163c51b75f4b04a3.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the green painted wood figure at left? (A) pink silk robe at center (B) orange painted wood rail at center (C) matte brown robe at center" }, { "from": "gpt", "value": "(B) orange painted wood rail at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/27c20421051467f8.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if pink fabric pants at center is bigger than light blue fabric pants at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, pink fabric pants at center is larger in size than light blue fabric pants at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b730fa4382441c89.jpg", "conversations": [ { "from": "human", "value": "\nDoes velvet maroon and gray graduation gown at center have a lesser width compared to black matte graduation gown at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, velvet maroon and gray graduation gown at center might be wider than black matte graduation gown at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7ef554e1c345a06.jpg", "conversations": [ { "from": "human", "value": "\nWhere is gray fabric bag at center located in relation to dark blue fabric coat at center in the image? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e474f02c881db26.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) black rubber stairs at left (B) smooth concrete stairs at center" }, { "from": "gpt", "value": "(A) black rubber stairs at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0a8b996f577e4a4.jpg", "conversations": [ { "from": "human", "value": "\nIs white fabric dress at center thinner than suede couch at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, white fabric dress at center might be wider than suede couch at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b42fe0854b7103af.jpg", "conversations": [ { "from": "human", "value": "\nIs blue water at center wider than polished brass streetlamp at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of blue water at center exceeds that of polished brass streetlamp at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/67707bfd6ddbd10c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if smooth concrete river at center is positioned to the right of rusty wood dock at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, smooth concrete river at center is to the left of rusty wood dock at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b17b577d353aba9.jpg", "conversations": [ { "from": "human", "value": "\nDoes clear water at lower left appear on the right side of light brown gravel at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, clear water at lower left is to the right of light brown gravel at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/232d1cbbdc4149f1.jpg", "conversations": [ { "from": "human", "value": "\nDoes black leather jacket at lower left appear over dark blue jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, black leather jacket at lower left is below dark blue jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1019b6c4da5266fb.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) sandy beach at lower right (B) clear blue water at lower left" }, { "from": "gpt", "value": "(A) sandy beach at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a0aa187eff493c62.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the white matte bag at center? Choose among these: (A) orange fabric shirt at center (B) light blue fabric shirt at center" }, { "from": "gpt", "value": "(B) light blue fabric shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5527832ce7d44a1.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) green uniform at center (B) matte black rifle at center (C) green fabric vest at center (D) blue fabric jacket at upper left" }, { "from": "gpt", "value": "(D) blue fabric jacket at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c1b0764067dab1e5.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if fluffy fur cat at center is positioned to the right of black plastic remote at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, fluffy fur cat at center is to the left of black plastic remote at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/953393c7827fcafd.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of black fabric flag at left and green fabric flag at upper right in the image provided, where is black fabric flag at left located with respect to green fabric flag at upper right? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0cc4637ac0155000.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of khaki fabric cap at center and red leather shoe at lower left in the image provided, where is khaki fabric cap at center located with respect to red leather shoe at lower left? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/637284615ac1a0ea.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.538, 0.828) (B) (0.464, 0.330)" }, { "from": "gpt", "value": "(A) (0.538, 0.828)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f78bb1ddb69b9e4b.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte jacket at center to the right of black reflective sunglasses at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find black matte jacket at center to the right of black reflective sunglasses at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c830313e7add71f9.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) pink satin sandal at lower right (B) blonde hair at upper center (C) white cotton skirt at center" }, { "from": "gpt", "value": "(A) pink satin sandal at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/715e0f368b07dc71.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white fleece hoodie at left is thinner than yellow-orange robe at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, white fleece hoodie at left is not thinner than yellow-orange robe at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4d9c95ec1c2d5e67.jpg", "conversations": [ { "from": "human", "value": "\nDoes white plastic turntable at center have a larger size compared to blue plastic homer simpson figurine at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c5c49833eade1936.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the denim shirt at center? Choose among these: (A) black and white striped dress at center (B) blue checkered shirt at center (C) blue chambray shirt at center" }, { "from": "gpt", "value": "(A) black and white striped dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f80828e550d1b0c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.335, 0.167) (B) (0.685, 0.453) (C) (0.053, 0.752) (D) (0.074, 0.425)" }, { "from": "gpt", "value": "(C) (0.053, 0.752)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d424b539d536b05.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of gray textured rhino at center in relation to matte gray rhino at left? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9e23d7970c9d7e3e.jpg", "conversations": [ { "from": "human", "value": "\nDoes wooden stairs at center come behind green fabric sleeping bag at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is in front of green fabric sleeping bag at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f0e8ea0c7a82cc80.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.710, 0.602) (B) (0.216, 0.627)" }, { "from": "gpt", "value": "(A) (0.710, 0.602)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/356dcce217dae3ad.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte graduation cap at lower left bigger than black satin gown at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, black matte graduation cap at lower left might be smaller than black satin gown at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a6bdb4002e944869.jpg", "conversations": [ { "from": "human", "value": "\nWhere is white fluffy cloud at upper center located in relation to brick chimney at center in the image? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1caab6d2a8f9a4ab.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the green coniferous trees at center? Choose from: (A) snowy granite mountain at left (B) green leafy tree at lower left" }, { "from": "gpt", "value": "(B) green leafy tree at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/329c8b3fabd38163.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) red brick castle at center (B) dark blue suit at left" }, { "from": "gpt", "value": "(A) red brick castle at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9a4ee67457d7e09.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.862, 0.659) (B) (0.656, 0.948)" }, { "from": "gpt", "value": "(A) (0.862, 0.659)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c0418bcafee9a1f8.jpg", "conversations": [ { "from": "human", "value": "\nDoes green matte screen at center appear on the right side of light blue shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, green matte screen at center is not to the right of light blue shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29a1bb56652a90c8.jpg", "conversations": [ { "from": "human", "value": "\nIs orange lanyard at right thinner than silver metallic laptop at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, orange lanyard at right is not thinner than silver metallic laptop at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/41c0f6cf358f183c.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the pink floral bed at center? Choose from: (A) pink fabric at center (B) dark gray fabric jacket at center (C) black fabric stroller at center (D) black asphalt path at center" }, { "from": "gpt", "value": "(C) black fabric stroller at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01c5fc1b56dace92.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the dark brown bark at center among (A) gray pinstripe suit at center (B) satin white dress at upper left?" }, { "from": "gpt", "value": "(A) gray pinstripe suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/673ec3114e2490bf.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.378, 0.283) (B) (0.284, 0.547) (C) (0.596, 0.730)" }, { "from": "gpt", "value": "(A) (0.378, 0.283)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e5b7c489056ee0e1.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte red shirt at left is positioned below gray matte shirt at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, matte red shirt at left is positioned under gray matte shirt at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05a04c98bcf81cdc.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if red matte jacket at center is positioned below metallic gray helicopter at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, red matte jacket at center is below metallic gray helicopter at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5181898dc76b8761.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of green grass at center in reference to gray fleece sweatshirt at center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8611aeab9386d711.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray striped cat at center come behind white matte flower at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b03ae56a1a1c055.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.513, 0.608) (B) (0.323, 0.398)" }, { "from": "gpt", "value": "(A) (0.513, 0.608)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d01950376150fd0e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.852, 0.320) (B) (0.260, 0.611) (C) (0.106, 0.886)" }, { "from": "gpt", "value": "(C) (0.106, 0.886)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f6613aca277b409.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.862, 0.397) (B) (0.176, 0.938)" }, { "from": "gpt", "value": "(B) (0.176, 0.938)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/255a9b3411948907.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray scaly dinosaur at center lie behind gray textured dinosaur at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4c2b9396e3a9ad7e.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the matte black phone at center? Choose from: (A) matte black camera at center (B) strawhat at center (C) brushed metal camera at left" }, { "from": "gpt", "value": "(A) matte black camera at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d74017e61bfcc0fd.jpg", "conversations": [ { "from": "human", "value": "\nIs brown cotton shirt at center above brown and white fur goat at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, brown cotton shirt at center is not above brown and white fur goat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0a2d035db62e8dc.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) clear water at lower center (B) pink matte swimsuit at center (C) pink fabric swimsuit at lower center (D) white matte t-shirt at lower center" }, { "from": "gpt", "value": "(C) pink fabric swimsuit at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a2c7b2abc54a49f.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is white painted steel bridge at center located relative to white glossy boat at center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8eafd974ac7df62c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) orange fabric shirt at center (B) black cotton shirt at center" }, { "from": "gpt", "value": "(B) black cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5de5900a71f96bc1.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the dark brown hair at center? (A) dark brown hair at upper right (B) green matte jacket at left" }, { "from": "gpt", "value": "(B) green matte jacket at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2bd0ffd346cc4c8a.jpg", "conversations": [ { "from": "human", "value": "\nIs matte green truck at center smaller than brown matte figure at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, matte green truck at center is not smaller than brown matte figure at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b16f07f95924be3.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the green matte tree at center among (A) brown rough bark tree at right (B) transparent water at center?" }, { "from": "gpt", "value": "(A) brown rough bark tree at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/619d4237899c7a93.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) rough bark tree trunk at left (B) green leafy tree at center (C) spotted fur leopard at center, is positioned farthest from the brown rough log at center?" }, { "from": "gpt", "value": "(A) rough bark tree trunk at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1aad755a63beabd3.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of green leafy palm tree at upper left and black metal cross at center in the image provided, where is green leafy palm tree at upper left located with respect to black metal cross at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc8f5f5a3a05a63d.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) striped cotton shirt at center (B) white plastic chair at lower left (C) matte black dress at upper center, is positioned closest to the matte black shirt at upper left?" }, { "from": "gpt", "value": "(B) white plastic chair at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6cfa208eaff9c678.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the matte black bag at center? (A) purple fabric bag at left (B) black uniform at center" }, { "from": "gpt", "value": "(B) black uniform at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85422ba994a35d74.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) black leather jacket at right (B) black lace dress at center" }, { "from": "gpt", "value": "(B) black lace dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b154c0ffa0e6cf7.jpg", "conversations": [ { "from": "human", "value": "\nDoes white striped shirt at center have a lesser width compared to dark gray wicker couch at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, white striped shirt at center's width is not less than dark gray wicker couch at left's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01d46638484e5be6.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) white bread at center (B) white tulle dress at center (C) black lace dress at left (D) pink floral dress at center, is positioned farthest from the blue lace dress at center?" }, { "from": "gpt", "value": "(A) white bread at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c495fcf48535814b.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.667, 0.481) (B) (0.714, 0.544) (C) (0.390, 0.614) (D) (0.281, 0.748)" }, { "from": "gpt", "value": "(C) (0.390, 0.614)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8fa8fc10251a40d8.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) wooden table at center (B) white creamy salad at upper left (C) brown matte potatoes at center (D) white matte potatoes at center" }, { "from": "gpt", "value": "(A) wooden table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46d5bcf4b7275251.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at center lie behind glistening water at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, green leafy tree at center is in front of glistening water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/893c56c3642f6e46.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) matte black shirt at upper left (B) brown paper bag at upper center (C) blue plaid shirt at upper right" }, { "from": "gpt", "value": "(A) matte black shirt at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c0cfe2e23703a5b4.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.200, 0.608) (B) (0.144, 0.589) (C) (0.661, 0.469)" }, { "from": "gpt", "value": "(A) (0.200, 0.608)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/45eee1826b05594a.jpg", "conversations": [ { "from": "human", "value": "\nIs brown stone church at center positioned in front of dark blue backpack at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, brown stone church at center is further to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8386ef22524a0a5b.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) clear water at lower left (B) green leafy palm tree at upper right" }, { "from": "gpt", "value": "(A) clear water at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f4b74369fde399d8.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the dark gray metallic pipe at center? (A) blue fabric jacket at center (B) matte black helmet at center" }, { "from": "gpt", "value": "(B) matte black helmet at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e5824aa9201e3e0.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth sandstone rocks at center further to the viewer compared to green matte tree at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is in front of green matte tree at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86b0891a4047415e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray wool coat at right is wider than light beige wool coat at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b6d5731ba1bb9380.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the dark wool coat at center? (A) dark gray coat at center (B) matte black coat at center" }, { "from": "gpt", "value": "(A) dark gray coat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f9382c0831b94be4.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.999, 0.058) (B) (0.409, 0.144)" }, { "from": "gpt", "value": "(B) (0.409, 0.144)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2807ab3faa1eb96b.jpg", "conversations": [ { "from": "human", "value": "\nIs dark blue suit at center positioned in front of black matte suit at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aa539396e22f5459.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) yellow plastic slide at right (B) pink fabric swing at center (C) matte black swing at center, is positioned closest to the pink satin dress at center?" }, { "from": "gpt", "value": "(C) matte black swing at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7671b36049943930.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.893, 0.828) (B) (0.237, 0.561) (C) (0.324, 0.286)" }, { "from": "gpt", "value": "(A) (0.893, 0.828)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b60fbe14cceb4e3a.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) matte black jacket at upper left (B) black leather jacket at left (C) glossy green ferrari at center (D) black plastic license plate at center, is positioned farthest from the leather jacket at upper center?" }, { "from": "gpt", "value": "(B) black leather jacket at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c3eab971023475c.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte gray sweater at center appear under white plastic clipboard at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b19dfdd0cf36f0cc.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte dark suit at left is wider than matte gray dress at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte dark suit at left is wider than matte gray dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0960504b2dad911c.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the striped cotton shirt at lower right? (A) multicolored fabric seats at center (B) blue fabric shorts at center" }, { "from": "gpt", "value": "(A) multicolored fabric seats at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/abcbb0987a4aa248.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if translucent water at center is thinner than green leafy tree at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df505da4a7af1d16.jpg", "conversations": [ { "from": "human", "value": "\nIs metallic maroon pickup truck at lower right bigger than shiny red sedan at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, metallic maroon pickup truck at lower right is not larger than shiny red sedan at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7f6aa09d4524146.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.992, 0.091) (B) (0.573, 0.683)" }, { "from": "gpt", "value": "(B) (0.573, 0.683)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/048611ebe9fd46e0.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green grassy at center is wider than brown rough bark tree at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, green grassy at center is wider than brown rough bark tree at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3915af3f66dd3076.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.946, 0.659) (B) (0.251, 0.753)" }, { "from": "gpt", "value": "(B) (0.251, 0.753)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/efdfc409f8de1402.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.138, 0.683) (B) (0.195, 0.537) (C) (0.459, 0.242) (D) (0.772, 0.866)" }, { "from": "gpt", "value": "(C) (0.459, 0.242)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b2b52d50041c311.jpg", "conversations": [ { "from": "human", "value": "\nDoes white fluffy snow at lower center have a smaller size compared to brown fur at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, white fluffy snow at lower center might be larger than brown fur at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/35b7c8b8fa2a709f.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) teal matte jacket at center (B) matte black jacket at left" }, { "from": "gpt", "value": "(A) teal matte jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/899012f5eea7c719.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.175, 0.555) (B) (0.781, 0.320)" }, { "from": "gpt", "value": "(B) (0.781, 0.320)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ddac49ac37b9ad4c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green plastic street sign at upper center is bigger than metallic pole at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, green plastic street sign at upper center is not larger than metallic pole at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4136ba9dbe9516c5.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if metallic gray drawer at left is positioned to the right of green glass bottle at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find metallic gray drawer at left to the right of green glass bottle at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e84f18d39e181a83.jpg", "conversations": [ { "from": "human", "value": "\nIs green tie-dye shirt at center in front of matte black blazer at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, green tie-dye shirt at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3ad1117fbf31417b.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) matte gray shirt at center (B) denim jeans at center (C) purple fleece jacket at center" }, { "from": "gpt", "value": "(A) matte gray shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b393d7f43b3b7795.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) black matte ship at left (B) brown matte water at lower left" }, { "from": "gpt", "value": "(B) brown matte water at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e7cc11cc538b9acb.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of black painted text at center and red matte boat at center in the image provided, where is black painted text at center located with respect to red matte boat at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/31faf2d1e9b49a4f.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) smooth skin toe at center (B) matte skin toe at upper center (C) matte skin toe at center (D) smooth skin foot at center" }, { "from": "gpt", "value": "(B) matte skin toe at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f904343ec1f487d0.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown stone castle at center have a lesser width compared to black metal fence at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a9dedd8ef3dd907e.jpg", "conversations": [ { "from": "human", "value": "\nDoes wooden slats at center have a greater width compared to metallic wire at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, wooden slats at center might be narrower than metallic wire at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/157b2cd4f1698104.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of floral pajamas at left in relation to shiny plastic toy at left? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f66c5b7081ccc7d3.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) yellow fabric table at center (B) matte white coat at upper right (C) orange tank top at upper left" }, { "from": "gpt", "value": "(B) matte white coat at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bfb4fc117b8c1a83.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte phone at center thinner than blue glossy text message at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, black matte phone at center is not thinner than blue glossy text message at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/550de0a70a68fd41.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.814, 0.655) (B) (0.513, 0.495) (C) (0.204, 0.325)" }, { "from": "gpt", "value": "(C) (0.204, 0.325)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c8cac90b06087f8.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) furry gray wolf at center right (B) gold textured fabric at center" }, { "from": "gpt", "value": "(B) gold textured fabric at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4065a56807445904.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.463, 0.547) (B) (0.611, 0.295) (C) (0.855, 0.392)" }, { "from": "gpt", "value": "(C) (0.855, 0.392)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/66659a83c03304e6.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the beige cotton shirt at center? Choose from: (A) beige fabric umbrella at center (B) sunglasses at upper center" }, { "from": "gpt", "value": "(B) sunglasses at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/874bc360481ae78b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark gray pants at center is smaller than dark gray t-shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, dark gray pants at center might be larger than dark gray t-shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/490914238bf23ea1.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) pink fabric doll at right (B) striped fabric doll at center" }, { "from": "gpt", "value": "(B) striped fabric doll at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9a309666dbb084b1.jpg", "conversations": [ { "from": "human", "value": "\nDoes beige concrete opera house at left have a greater width compared to striped shirt at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, beige concrete opera house at left has a greater width compared to striped shirt at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1fc1d11b34b02c35.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.574, 0.928) (B) (0.460, 0.850)" }, { "from": "gpt", "value": "(A) (0.574, 0.928)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca5b889b4ec6a21d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.940, 0.502) (B) (0.590, 0.922)" }, { "from": "gpt", "value": "(B) (0.590, 0.922)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e1913746abf48d55.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of matte black helicopter at left in relation to red fabric helmet at upper right? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fbf1a73dee1b474e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black matte t-shirt at center is smaller than black matte shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, black matte t-shirt at center occupies less space than black matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bbbf3b3c29aa1c0c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.599, 0.525) (B) (0.671, 0.680) (C) (0.881, 0.637) (D) (0.972, 0.928)" }, { "from": "gpt", "value": "(C) (0.881, 0.637)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4c3b7935e7e50925.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) blue water at lower center (B) smooth stone hillside at center" }, { "from": "gpt", "value": "(A) blue water at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c710e29f2c9929c6.jpg", "conversations": [ { "from": "human", "value": "\nIs dark brown leather jacket at center further to the viewer compared to white paper cup at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f830f82c15c4654f.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of green leafy tree at right in reference to pink fabric flower at left? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dedbf50738256cfb.jpg", "conversations": [ { "from": "human", "value": "\nDoes purple puffy jacket at center appear on the left side of reflective plastic goggles at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, purple puffy jacket at center is not on the left side of reflective plastic goggles at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aa1557276a523579.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) denim shorts at lower right (B) green fabric jacket at center" }, { "from": "gpt", "value": "(B) green fabric jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/beef1091bb926032.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.482, 0.484) (B) (0.198, 0.556)" }, { "from": "gpt", "value": "(A) (0.482, 0.484)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4f196d645bb56bf.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray textured salamander at center have a lesser width compared to black and white striped salamander at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, gray textured salamander at center is not thinner than black and white striped salamander at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/89b66837882ed890.jpg", "conversations": [ { "from": "human", "value": "\nIs blonde hair at center closer to camera compared to shiny blue dress at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is in front of shiny blue dress at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3fc2fb549bd4d66a.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) shiny red bicycle at upper center (B) wooden picture frame at upper right (C) matte black picture frame at upper left" }, { "from": "gpt", "value": "(A) shiny red bicycle at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7299fb273a53289.jpg", "conversations": [ { "from": "human", "value": "\nIs white plastic sign at upper right further to camera compared to white plastic sign at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, white plastic sign at upper right is in front of white plastic sign at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/69607a5ac675c691.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark blue jeans at center have a larger size compared to matte red shirt at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, dark blue jeans at center is not larger than matte red shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0694576b5509d85f.jpg", "conversations": [ { "from": "human", "value": "\nDoes black car at left have a lesser width compared to green leafy tree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/21d22d04a1bc6547.jpg", "conversations": [ { "from": "human", "value": "\nDoes wooden walkway at center come behind blue denim jeans at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/89232df12c6ff52d.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of smooth concrete water at lower center in relation to rusty metal bridge at center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d81ef9d2cd39986a.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the white plastic license plate at rear among (A) glossy black hatchback at center (B) snowy mountain range at upper center?" }, { "from": "gpt", "value": "(B) snowy mountain range at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c6733bd815640bd.jpg", "conversations": [ { "from": "human", "value": "\nDoes floral print scarf at center come behind leopard print scarf at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is behind leopard print scarf at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00793d4993c9069d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if translucent yellow bulb at center is positioned below matte black shirt at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, translucent yellow bulb at center is not below matte black shirt at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c938234fe53c16f.jpg", "conversations": [ { "from": "human", "value": "\nIs white cotton shirt at center above matte black car at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white cotton shirt at center is not above matte black car at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0fef2a29c4eeae16.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green matte jacket at center is positioned above green felt hat at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, green matte jacket at center is not above green felt hat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8ce663a00f83d40c.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the green reflective lenses at center? (A) silky yellow shirt at right (B) matte brown vest at left (C) shiny gold vest at center" }, { "from": "gpt", "value": "(C) shiny gold vest at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a421645a7b1af84c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the green matte pole at center? Choose among these: (A) green matte signpost at center (B) white plastic sign at center" }, { "from": "gpt", "value": "(B) white plastic sign at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/989ba931583e0bdb.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.362, 0.727) (B) (0.384, 0.736)" }, { "from": "gpt", "value": "(B) (0.384, 0.736)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db4125826049d792.jpg", "conversations": [ { "from": "human", "value": "\nDoes white fabric tent at center have a lesser width compared to yellow matte taxi at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white fabric tent at center's width is not less than yellow matte taxi at lower left's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a53346db04edef7c.jpg", "conversations": [ { "from": "human", "value": "\nDoes green matte herb at center have a smaller size compared to brown matte coriander seeds at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/42ad8446d87fad01.jpg", "conversations": [ { "from": "human", "value": "\nIs knit sweater at left further to the viewer compared to matte red sweater at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, knit sweater at left is in front of matte red sweater at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e092f79c47f09927.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.436, 0.361) (B) (0.267, 0.741)" }, { "from": "gpt", "value": "(A) (0.436, 0.361)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c149716a9cf4abad.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the white cotton dress at center? Choose among these: (A) white fabric dress at center (B) polka dot fabric dress at center (C) matte pink swimsuit at center" }, { "from": "gpt", "value": "(A) white fabric dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7f150183e94af02c.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the black suit at center? (A) white lace dress at center (B) leather-like brown chair at center-right (C) black matte dress at lower left (D) black matte leggings at lower center" }, { "from": "gpt", "value": "(C) black matte dress at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1686cb2579bede40.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the blue fabric shirt at center? Choose from: (A) dark gray fabric jacket at center (B) brown stone pavement at lower center (C) blue printed shorts at lower left" }, { "from": "gpt", "value": "(C) blue printed shorts at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/011037b6a9ac1be1.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.605, 0.356) (B) (0.881, 0.959)" }, { "from": "gpt", "value": "(B) (0.881, 0.959)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/464eb07ed95c5266.jpg", "conversations": [ { "from": "human", "value": "\nIs transparent glass mannequin torso at center smaller than smooth skin torso at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, transparent glass mannequin torso at center is not smaller in size than smooth skin torso at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a6ed0f8fafcc2391.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is green leafy tree at center located relative to metallic blue boat at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9e7ad721c71e475c.jpg", "conversations": [ { "from": "human", "value": "\nDoes white glossy shirt at left have a larger size compared to silky purple dress at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, white glossy shirt at left has a larger size compared to silky purple dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9dd6b1f2f99fbb39.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) white marble fountain at center (B) brown stone statue at center, is positioned closest to the granite column at center?" }, { "from": "gpt", "value": "(A) white marble fountain at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f4f31b0bc48e6748.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) gray fabric shirt at center (B) matte brown shirt at left (C) dark gray hoodie at lower left" }, { "from": "gpt", "value": "(B) matte brown shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a52b468f8de0970.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the black painted wood fireplace at center? (A) matte wooden picture frame at upper center (B) brown wooden barrel at left (C) smooth dark wood mantle at upper center (D) brown wooden chair at lower left" }, { "from": "gpt", "value": "(C) smooth dark wood mantle at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e202b4a3eff624b1.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) brown rough bark tree at left (B) brown bark tree at right" }, { "from": "gpt", "value": "(B) brown bark tree at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3bade2bb2ab30a56.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue paperboard at upper right come behind woven straw lion at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d675dc1cefd89d1.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.715, 0.369) (B) (0.328, 0.817)" }, { "from": "gpt", "value": "(A) (0.715, 0.369)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/93c944d5845c5fff.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) black matte uniform at center (B) blue uniform shirt at center" }, { "from": "gpt", "value": "(B) blue uniform shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/110ba0ab81044186.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.501, 0.717) (B) (0.615, 0.198) (C) (0.351, 0.498)" }, { "from": "gpt", "value": "(A) (0.501, 0.717)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c886a73433b5ac34.jpg", "conversations": [ { "from": "human", "value": "\nIs plaid shirt at center to the right of plaid cotton shirt at left from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, plaid shirt at center is to the right of plaid cotton shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d7f946905ae6fe97.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.944, 0.963) (B) (0.882, 0.406) (C) (0.210, 0.727)" }, { "from": "gpt", "value": "(C) (0.210, 0.727)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/deb83200336f762b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark brown leather jacket at center is thinner than matte black jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, dark brown leather jacket at center has a lesser width compared to matte black jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d86068ab1c48078c.jpg", "conversations": [ { "from": "human", "value": "\nDoes stone arches at center have a greater width compared to stone column at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of stone arches at center exceeds that of stone column at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/953c97f4f109ac7d.jpg", "conversations": [ { "from": "human", "value": "\nIs brown gravel track at center to the right of stone arch bridge at upper center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, brown gravel track at center is to the left of stone arch bridge at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4e5cfaa84bfa279e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.674, 0.447) (B) (0.413, 0.463) (C) (0.606, 0.722) (D) (0.739, 0.289)" }, { "from": "gpt", "value": "(C) (0.606, 0.722)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f87e0844d67fc811.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the white cotton beekeeper suit at center? (A) weathered wood beehive at right (B) teal fabric vest at center (C) rusty corrugated metal hut at upper center" }, { "from": "gpt", "value": "(B) teal fabric vest at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb28cc38a1a765f2.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.877, 0.620) (B) (0.841, 0.631) (C) (0.392, 0.456) (D) (0.245, 0.609)" }, { "from": "gpt", "value": "(A) (0.877, 0.620)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/21f3c167dc39791a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte yellow t-shirt at center is thinner than black bandana at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ac1d967413edc0ad.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.263, 0.353) (B) (0.222, 0.469) (C) (0.201, 0.359) (D) (0.778, 0.461)" }, { "from": "gpt", "value": "(A) (0.263, 0.353)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6c6c1d6101fece8.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at upper right have a larger size compared to green leafy tree at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, green leafy tree at upper right has a larger size compared to green leafy tree at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a4ce7c5dd38566f.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if red and white fabric banner at center is smaller than green fabric sign at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, red and white fabric banner at center might be larger than green fabric sign at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fd5f1d8f7f1e06ea.jpg", "conversations": [ { "from": "human", "value": "\nDoes light blue fabric shirt at center come in front of red jacket at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, light blue fabric shirt at center is in front of red jacket at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/39a5b2cc9a8e5a53.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown plastic bench at center appear under tan plastic bench at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/64f0c852bd9083aa.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is pink fabric shirt at center located relative to white shirt at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a4069a9b8cc3a95.jpg", "conversations": [ { "from": "human", "value": "\nIs black gravel at center positioned behind teal glossy fence at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, black gravel at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/417a35983fa0002a.jpg", "conversations": [ { "from": "human", "value": "\nIs brown wooden door at center above red painted text at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5f57c489ec07691.jpg", "conversations": [ { "from": "human", "value": "\nIs bare branches at center wider than clear glass window at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0fc9172723ddd74a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black jersey at center is positioned to the left of matte gray jersey at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte black jersey at center is to the left of matte gray jersey at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8148c52b73f1b483.jpg", "conversations": [ { "from": "human", "value": "\nIs blue fabric flag at center thinner than gray knit sweater at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, blue fabric flag at center might be wider than gray knit sweater at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/383c197f129c0559.jpg", "conversations": [ { "from": "human", "value": "\nIs navy blue jersey at center to the right of matte white football at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, navy blue jersey at center is to the right of matte white football at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f4a55e9bbcb1940.jpg", "conversations": [ { "from": "human", "value": "\nDoes printed fabric dress at left appear on the left side of maroon and white striped fabric hat at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, printed fabric dress at left is to the left of maroon and white striped fabric hat at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04db1398cd68e59b.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.303, 0.533) (B) (0.862, 0.681) (C) (0.354, 0.842)" }, { "from": "gpt", "value": "(C) (0.354, 0.842)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ed89f62948775ad.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brownsmoothhair at left is positioned above brownhair at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b75a52a31956cac.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.837, 0.270) (B) (0.626, 0.955)" }, { "from": "gpt", "value": "(A) (0.837, 0.270)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3dfcfa9f8eccc3de.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.535, 0.495) (B) (0.063, 0.611)" }, { "from": "gpt", "value": "(A) (0.535, 0.495)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ffdb3e5e6069080.jpg", "conversations": [ { "from": "human", "value": "\nIs green textured tree trunk at upper right smaller than green textured tree trunk at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, green textured tree trunk at upper right might be larger than green textured tree trunk at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d42727e3055c707f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.727, 0.933) (B) (0.639, 0.309) (C) (0.218, 0.672) (D) (0.872, 0.675)" }, { "from": "gpt", "value": "(C) (0.218, 0.672)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df9e582d51029b18.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.331, 0.605) (B) (0.579, 0.473)" }, { "from": "gpt", "value": "(B) (0.579, 0.473)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/76d8f99af20be64a.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) neon green fabric shirt at center (B) green reflective sunglasses at center (C) yellow matte sunglasses at center (D) neon pink leggings at center" }, { "from": "gpt", "value": "(D) neon pink leggings at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1497b0a719ea786.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue metallic bus stop at lower left appear over wooden spire at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, blue metallic bus stop at lower left is below wooden spire at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b2b2303ef8e5344c.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is white plastic alarm clock at center located relative to black matte digital clock at left? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ba5798c25cbdebb.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the yellow ombre blouse at lower right from the following options: (A) matte paper poster at center (B) white fabric canopy at upper right (C) floral-patterned fabric at lower right?" }, { "from": "gpt", "value": "(B) white fabric canopy at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/298cebc2f5b45c83.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green leafy tree at center located in relation to brown gravel path at center in the image? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ff28469054ade9c.jpg", "conversations": [ { "from": "human", "value": "\nIs white cotton crowd at lower center below blue fabric shirt at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ebaa39f83dd98f3.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.093, 0.383) (B) (0.789, 0.252) (C) (0.699, 0.330)" }, { "from": "gpt", "value": "(A) (0.093, 0.383)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/220ae97e2b6364b2.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the bronze statue at upper right among (A) white marble statue at upper right (B) gray stone angel at center (C) beige stone statue at center-left (D) polished stone statue at center?" }, { "from": "gpt", "value": "(D) polished stone statue at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d3a60b2a8b207bb.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white fabric at center is positioned to the left of iridescent glass chandelier at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white fabric at center is not on the left side of iridescent glass chandelier at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ad1403dc01c7824.jpg", "conversations": [ { "from": "human", "value": "\nIs brown striped duck at right above dark brown feathers at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, brown striped duck at right is located above dark brown feathers at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/105f8d44e6b3f8ec.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.933, 0.534) (B) (0.667, 0.398)" }, { "from": "gpt", "value": "(A) (0.933, 0.534)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/71e0e19d1a93d700.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray stone statue at upper right is positioned below gray stone statue at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/483913e6ef282ae0.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.431, 0.431) (B) (0.130, 0.419)" }, { "from": "gpt", "value": "(B) (0.130, 0.419)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7599bf8b6ea4c3fd.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.016, 0.366) (B) (0.219, 0.753) (C) (0.853, 0.319)" }, { "from": "gpt", "value": "(A) (0.016, 0.366)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/befb4b03f877a776.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the blue denim jacket at center from the following options: (A) light blue fabric jacket at center (B) dark brown leather jacket at center?" }, { "from": "gpt", "value": "(A) light blue fabric jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c867c12a7cea11e0.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the green patinated bronze statue at lower left from the following options: (A) bronze statue at lower left (B) blue striped dome at center?" }, { "from": "gpt", "value": "(A) bronze statue at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/391bb732c0a9796b.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.427, 0.756) (B) (0.626, 0.002)" }, { "from": "gpt", "value": "(B) (0.626, 0.002)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7f3717388f53fa34.jpg", "conversations": [ { "from": "human", "value": "\nWhere is matte beige tank top at center located in relation to matte black jacket at center in the image? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b25faaa6d25a6c0b.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) green grassy field at center (B) rugged stone mountain at upper center" }, { "from": "gpt", "value": "(A) green grassy field at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/288e8e9ee0f3e351.jpg", "conversations": [ { "from": "human", "value": "\nIs matte gold earring at center further to camera compared to gold wire mesh earring at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is in front of gold wire mesh earring at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be4f85d29251f274.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the black cotton shirt at center? (A) black wool coat at center (B) maroon striped tie at right (C) dark gray suit at center" }, { "from": "gpt", "value": "(C) dark gray suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/41d8793e8e16624d.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the satin brown cookies at center among (A) matte yellow cookies at center-left (B) shiny chocolate cookies at center (C) golden brown cookie at center (D) smooth porcelain baby at center?" }, { "from": "gpt", "value": "(B) shiny chocolate cookies at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df0b8e100177fc64.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) shiny red drum at center (B) leather drum at right (C) matte red drum at center (D) fur-like brown drum at center" }, { "from": "gpt", "value": "(C) matte red drum at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f4f603d4e2657c96.jpg", "conversations": [ { "from": "human", "value": "\nWhere is wooden bench at center located in relation to matte red shirt at right in the image? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/288eff797ecdd991.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark blue water at center is positioned to the right of green matte container ship at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, dark blue water at center is not to the right of green matte container ship at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8bf2f7af6c7a3c0.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.611, 0.583) (B) (0.646, 0.650) (C) (0.608, 0.647)" }, { "from": "gpt", "value": "(B) (0.646, 0.650)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/24e7b0a2c8e2cac8.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) plaid shirt at center (B) pink glossy plate at center" }, { "from": "gpt", "value": "(A) plaid shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a0dee389604caa0.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) blue shirt at upper right (B) dark green vest at left (C) white paper at center (D) black shirt at center" }, { "from": "gpt", "value": "(C) white paper at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85155f178488c4f8.jpg", "conversations": [ { "from": "human", "value": "\nIs white stone stairs at left positioned in front of black matte clothing at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2912b14b67229857.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.693, 0.244) (B) (0.774, 0.641) (C) (0.589, 0.316) (D) (0.810, 0.550)" }, { "from": "gpt", "value": "(A) (0.693, 0.244)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3158ccefb9c018d5.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) white glossy bridge at center (B) smooth brown water at lower center (C) blue matte sailboat at right" }, { "from": "gpt", "value": "(A) white glossy bridge at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/96cb0472e7dd1631.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.940, 0.630) (B) (0.236, 0.259)" }, { "from": "gpt", "value": "(A) (0.940, 0.630)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d38145c56c0eb47c.jpg", "conversations": [ { "from": "human", "value": "\nWhere is patterned fabric dress at right located in relation to white cloth-covered table at center in the image? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d429a71b585e658e.jpg", "conversations": [ { "from": "human", "value": "\nWhere is silhouette branches at center located in relation to black matte hut at center in the image? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37f0080a88d573a0.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of dark blue uniform at right in reference to green metal train track at center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00e3993db63e5dd1.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) metallic construction crane at upper center (B) matte glass skyscraper at upper left (C) gold glass tower at center" }, { "from": "gpt", "value": "(B) matte glass skyscraper at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de050afb996bce13.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte scarf at left below striped knit sweater at right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, black matte scarf at left is above striped knit sweater at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5ecc9f69caff2137.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) brown bark tree at left (B) green painted wood bench at center" }, { "from": "gpt", "value": "(A) brown bark tree at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06dea8ad35f2adc2.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) dark fabric dress at center (B) light green t-shirt at center" }, { "from": "gpt", "value": "(A) dark fabric dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b1a9b78973bb370.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black suit at left is positioned below blue fabric shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, matte black suit at left is not positioned below blue fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c57ac29ef4fee451.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth concrete pavement at center positioned behind matte black backpack at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, smooth concrete pavement at center is in front of matte black backpack at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b44b2d04092252e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if weathered wood barn door at center is smaller than blue denim jumpsuit at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, weathered wood barn door at center is not smaller than blue denim jumpsuit at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/39e8873dc0b7fd90.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) matte black backpack at center (B) blue matte jacket at upper left (C) gray matte jacket at center (D) pink fabric pants at center" }, { "from": "gpt", "value": "(B) blue matte jacket at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3eebf3620da1ecb2.jpg", "conversations": [ { "from": "human", "value": "\nIs brown leather jacket at lower right smaller than green plastic canoe at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, brown leather jacket at lower right has a smaller size compared to green plastic canoe at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3caeb0c92a26635c.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black car at center to the right of matte silver car at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find matte black car at center to the right of matte silver car at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dff640713094abb0.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte jeep at center bigger than black plastic license plate at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, white matte jeep at center has a larger size compared to black plastic license plate at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e5a7c48c760d0cf4.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.623, 0.647) (B) (0.747, 0.505) (C) (0.384, 0.736)" }, { "from": "gpt", "value": "(C) (0.384, 0.736)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8f489f55b8ea8a96.jpg", "conversations": [ { "from": "human", "value": "\nDoes white concrete column at center appear on the left side of white smooth column at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, white concrete column at center is to the left of white smooth column at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/18db8c22ff694ef4.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white matte sign at center is positioned to the left of metallic silver sedan at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, white matte sign at center is positioned on the left side of metallic silver sedan at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5f3a91bfec299be9.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark gray fleece jacket at left is wider than plaid fabric shirt at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of dark gray fleece jacket at left exceeds that of plaid fabric shirt at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e4edc86e38ae5c5f.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at center further to camera compared to green matte tree at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a96983eb26442dc6.jpg", "conversations": [ { "from": "human", "value": "\nIs skinny white leg at center above pink smooth foot at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, skinny white leg at center is above pink smooth foot at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a9758da28f98e114.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) glossy water at center (B) green mossy hillside at left" }, { "from": "gpt", "value": "(B) green mossy hillside at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/45b88e2b20dc4886.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the dark brown hair at lower left among (A) white fabric sail at center (B) silver metallic mast at center?" }, { "from": "gpt", "value": "(B) silver metallic mast at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9bad3ea93938dae2.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is black matte tank top at center located relative to matte black sunglasses at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0653dda9cff15680.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) white fluffy cloud at upper center (B) green grassy field at lower center" }, { "from": "gpt", "value": "(B) green grassy field at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5bd4b6816c935afa.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the glassy steel skyscraper at right? Choose among these: (A) green leafy tree at lower center (B) green leafy tree at lower left (C) green leafy tree at center (D) glassy steel skyscraper at center" }, { "from": "gpt", "value": "(D) glassy steel skyscraper at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d09caa8f07c78c99.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass at center smaller than white matte t-shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b430e6aa4c127b8d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.738, 0.597) (B) (0.902, 0.781)" }, { "from": "gpt", "value": "(A) (0.738, 0.597)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8217534c1268cbc8.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black cards at left lie behind golden brown crumbly cookie at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, matte black cards at left is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fcbec7b8db778257.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the black matte t-shirt at center? Choose among these: (A) black plastic microphone at center (B) black matte/soft skin at center" }, { "from": "gpt", "value": "(A) black plastic microphone at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/485947d7d8c79c60.jpg", "conversations": [ { "from": "human", "value": "\nWhere is brown fabric purse at center located in relation to matte black purse at left in the image? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6848ac2f433bf457.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the white glossy microwave at right? (A) white plastic water dispenser at right (B) black matte exhaust hood at upper left (C) stainless steel sink at center" }, { "from": "gpt", "value": "(B) black matte exhaust hood at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/896309dde87ffc9e.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.947, 0.609) (B) (0.960, 0.886) (C) (0.160, 0.392)" }, { "from": "gpt", "value": "(C) (0.160, 0.392)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ae000f8a4456707.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is green mossy rock at left located relative to green mossy rock at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08c56e12a6630306.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.525, 0.573) (B) (0.310, 0.597) (C) (0.181, 0.858) (D) (0.781, 0.591)" }, { "from": "gpt", "value": "(C) (0.181, 0.858)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/558d35bef198fd97.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny red uniform at center positioned in front of red velvet uniform at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a52f67c9acd80888.jpg", "conversations": [ { "from": "human", "value": "\nIs coarse fabric jacket at right positioned behind denim jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is in front of denim jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e37b2e306708ea95.jpg", "conversations": [ { "from": "human", "value": "\nDoes transparent water at center have a smaller size compared to white matte pelican at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, transparent water at center occupies less space than white matte pelican at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/09e583a1ead37bbf.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) brown leather shoes at center (B) natural wood tower at center" }, { "from": "gpt", "value": "(B) natural wood tower at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fadef24d9c25e6c8.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the black matte sign at upper center? (A) metallic gray rail at lower center (B) metallic pole at upper left" }, { "from": "gpt", "value": "(B) metallic pole at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/127ceffbd5fcc809.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.291, 0.528) (B) (0.517, 0.758) (C) (0.476, 0.503) (D) (0.246, 0.316)" }, { "from": "gpt", "value": "(C) (0.476, 0.503)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1715089a7d99ab7.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy stream at lower center have a lesser width compared to dark blue shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, green leafy stream at lower center's width is not less than dark blue shirt at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/47706ac61cd5d8b5.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) blue matte boat at center (B) blue water at center, is positioned farthest from the white matte hut at center?" }, { "from": "gpt", "value": "(B) blue water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e1628cea87a88e49.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.188, 0.536) (B) (0.670, 0.652) (C) (0.817, 0.677)" }, { "from": "gpt", "value": "(A) (0.188, 0.536)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/993ae061e6f33d78.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) yellow metal sign at center (B) yellow matte diamond at center" }, { "from": "gpt", "value": "(A) yellow metal sign at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0270400677cf2497.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if fuzzy black and white plush at left is thinner than black plush panda at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, fuzzy black and white plush at left has a lesser width compared to black plush panda at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/93d0b490c931c8c2.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) rubberized yellow balloon at upper center (B) light brown shirt at upper center (C) black matte jacket at center" }, { "from": "gpt", "value": "(B) light brown shirt at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e6306712c37d6390.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) white wooden sailboat at center (B) frosted glass tree at left (C) blue glassy water at lower left" }, { "from": "gpt", "value": "(C) blue glassy water at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c79d87e368bfeec2.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of brown rough bark tree at upper center in relation to gray matte kangaroo at upper center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/886d1793b0f1a2dd.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black fabric at center is positioned below denim jeans at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, black fabric at center is not positioned below denim jeans at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bdad20dc371fe673.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.875, 0.727) (B) (0.060, 0.942)" }, { "from": "gpt", "value": "(A) (0.875, 0.727)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a486bd07b63d49f4.jpg", "conversations": [ { "from": "human", "value": "\nDoes white rubber finish line at center appear over white plastic tennis racket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, white rubber finish line at center is below white plastic tennis racket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6eda05ef49c099ef.jpg", "conversations": [ { "from": "human", "value": "\nWhere is dark gray water at center located in relation to gray smooth whale at center in the image? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e07e69e60ce27603.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) white cotton shirt at upper right (B) white plastic train at lower left" }, { "from": "gpt", "value": "(A) white cotton shirt at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f53df9f5c6d5e126.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.150, 0.431) (B) (0.379, 0.542) (C) (0.256, 0.963)" }, { "from": "gpt", "value": "(C) (0.256, 0.963)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f99d8852d906e4a6.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the khaki cotton shirt at right? (A) metallic blue shirt at center (B) metallic purple car at center (C) purple metallic car at center" }, { "from": "gpt", "value": "(A) metallic blue shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/63760ce1ea4faadc.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the printed silk blouse at center? Choose among these: (A) printed cotton shirt at center (B) blue lace dress at right (C) white textured cardigan at upper left (D) translucent white dress at center" }, { "from": "gpt", "value": "(C) white textured cardigan at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2db779e1439f29b7.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the black matte nose at center among (A) gray fuzzy beard at center (B) matte orange robe at center?" }, { "from": "gpt", "value": "(B) matte orange robe at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ecef9dd453e1fdfe.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of smooth gray sweater at right in reference to blue striped tie at left? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0739ab79afb19da8.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black suit at center wider than striped silk tie at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of matte black suit at center exceeds that of striped silk tie at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b2f79c49bcb1373.jpg", "conversations": [ { "from": "human", "value": "\nDoes orange matte shirt at left appear on the right side of white bread at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, orange matte shirt at left is not on the right side of white bread at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/058c7902828d55c0.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of green leafy fern at lower center in reference to gray stone head at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5b629c620c78c6e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.525, 0.836) (B) (0.442, 0.570) (C) (0.400, 0.637) (D) (0.613, 0.834)" }, { "from": "gpt", "value": "(D) (0.613, 0.834)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/da8a34ead9756805.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown furry dog at center is positioned to the right of brown smooth dog at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, brown furry dog at center is to the right of brown smooth dog at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/079f37779f7da167.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue corrugated metal window at right appear over smooth red corrugated metal at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, blue corrugated metal window at right is not above smooth red corrugated metal at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c7137ad9290aa0e.jpg", "conversations": [ { "from": "human", "value": "\nDoes light brown wood guitar at center have a larger size compared to light blue fabric pants at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, light brown wood guitar at center might be smaller than light blue fabric pants at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03675681667b2632.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte shirt at center wider than cardboard box at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, white matte shirt at center might be narrower than cardboard box at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/69347423e2c8af16.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.510, 0.884) (B) (0.733, 0.639)" }, { "from": "gpt", "value": "(B) (0.733, 0.639)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d2d60db6371e330.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of smooth skin hand at center less distant than that of pink matte foot at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7deb0776b84d7e5.jpg", "conversations": [ { "from": "human", "value": "\nDoes beige corduroy jacket at upper left have a greater width compared to matte black suit at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, the width of beige corduroy jacket at upper left exceeds that of matte black suit at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6dbf86ade150c116.jpg", "conversations": [ { "from": "human", "value": "\nDoes rugged stone mountain at center appear on the right side of green leafy bush at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, rugged stone mountain at center is not on the right side of green leafy bush at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb44775a24702511.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue quilted jacket at center is bigger than yellow plastic goggles at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, blue quilted jacket at center has a larger size compared to yellow plastic goggles at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4d2b7648e33cedcd.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of pink matte shirt at center less distant than that of pink fabric headband at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is behind pink fabric headband at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/900579ea52fc8a47.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.204, 0.556) (B) (0.820, 0.803)" }, { "from": "gpt", "value": "(A) (0.204, 0.556)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/276a498ed04e3157.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is white fluffy snow at center located relative to wooden steps at lower right? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7aeaeffd320372bf.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.769, 0.908) (B) (0.483, 0.920)" }, { "from": "gpt", "value": "(A) (0.769, 0.908)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c47ea476213d0121.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte shirt at center have a larger size compared to blue fleece jacket at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, white matte shirt at center is bigger than blue fleece jacket at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/21780ed137a5d15c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) clear glass wine glass at left (B) smooth beige shirt at center" }, { "from": "gpt", "value": "(B) smooth beige shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5bd9358152666e4c.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is green grassy field at lower center located relative to shiny black dog at lower center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f1cdd89928f9c10.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green grass at lower right is positioned below brown fur dog at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, green grass at lower right is positioned under brown fur dog at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1aab569ca0bfad0f.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) matte white hand at center (B) matte black hand at left (C) matte black hand at center (D) matte black blazer at center" }, { "from": "gpt", "value": "(D) matte black blazer at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7d0020b038db6361.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte blue jersey at center have a lesser width compared to matte yellow helmet at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, matte blue jersey at center is not thinner than matte yellow helmet at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/54b76c31c7da6a6a.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of green leafy tree at upper left and matte red bird at center in the image provided, where is green leafy tree at upper left located with respect to matte red bird at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e19fcbd204efdeeb.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white porcelain plate at lower left is thinner than wooden handle knife at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white porcelain plate at lower left is not thinner than wooden handle knife at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/25b20a7f29a0e625.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.375, 0.836) (B) (0.621, 0.645)" }, { "from": "gpt", "value": "(A) (0.375, 0.836)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0053f4f3a2740a57.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) orange rubber jump rope at lower right (B) matte purple hoodie at center (C) red hoodie at left" }, { "from": "gpt", "value": "(C) red hoodie at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b23e6e6699e59a28.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray fabric at upper right appear on the right side of matte wooden boat at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, gray fabric at upper right is to the right of matte wooden boat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e5709f3cda42958.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown leafy tree at center come behind asphalt road at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d82dd134533841da.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) white matte shirt at upper right (B) yellow glossy helicopter at center" }, { "from": "gpt", "value": "(B) yellow glossy helicopter at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1d03f305aeb30b9.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte boat at center appear over metallic silver boat at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eeca688723553fde.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if metallic silver bicycle at lower center is smaller than metallic gold bicycle at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, metallic silver bicycle at lower center is not smaller in size than metallic gold bicycle at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1d47b80a61e4677.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of matte red bucket at center and green fabric shirt at center in the image provided, where is matte red bucket at center located with respect to green fabric shirt at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a311319327e0556c.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.145, 0.042) (B) (0.972, 0.766) (C) (0.611, 0.670)" }, { "from": "gpt", "value": "(B) (0.972, 0.766)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4aa6285a09497bca.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) dark brown leather jacket at lower right (B) red/yellow fabric flag at upper center, is positioned farthest from the dark brown leather coat at lower right?" }, { "from": "gpt", "value": "(B) red/yellow fabric flag at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23f6ef49e88537c0.jpg", "conversations": [ { "from": "human", "value": "\nIs brown wooden bridge at center bigger than blue denim jeans at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, brown wooden bridge at center is larger in size than blue denim jeans at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73c9e7cd06cf5c1a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.450, 0.620) (B) (0.708, 0.466)" }, { "from": "gpt", "value": "(B) (0.708, 0.466)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8254dce495ba46df.jpg", "conversations": [ { "from": "human", "value": "\nIs green matte christmas tree at center above wooden bookshelf at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60001fbc8fb32504.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.893, 0.350) (B) (0.438, 0.397)" }, { "from": "gpt", "value": "(A) (0.893, 0.350)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/09a041a06f83e06b.jpg", "conversations": [ { "from": "human", "value": "\nIs green matte/black plastic gear at center to the right of green matte lego brick at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, green matte/black plastic gear at center is to the right of green matte lego brick at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f2a5e62f268bbf7d.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) glossy red hatchback at center (B) metallic silver sedan at lower right (C) shiny silver sedan at left" }, { "from": "gpt", "value": "(A) glossy red hatchback at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d89a5ee199dc22ec.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) gray smooth dolphin at center (B) blue smooth jacket at center" }, { "from": "gpt", "value": "(B) blue smooth jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c86fee2c155fec47.jpg", "conversations": [ { "from": "human", "value": "\nIs bronze statue at center below bronze statue at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, bronze statue at center is positioned under bronze statue at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc6b5aef87b2a6fd.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue fleece jacket at center have a smaller size compared to black plastic camera at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5be8981e4868740.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) blue cotton shirt at center (B) smooth orange fruit at center" }, { "from": "gpt", "value": "(B) smooth orange fruit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b795033c7013d2e8.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at lower left smaller than green leafy tree at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, green leafy tree at lower left occupies less space than green leafy tree at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/67aee1ef1b03c3d4.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny black car at center right smaller than shiny silver sedan at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, shiny black car at center right occupies less space than shiny silver sedan at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/479165c540841092.jpg", "conversations": [ { "from": "human", "value": "\nDoes green mossy stone at upper center have a larger size compared to brown wooden plank at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green mossy stone at upper center has a larger size compared to brown wooden plank at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/53998ecf6d58115a.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.971, 0.867) (B) (0.200, 0.503)" }, { "from": "gpt", "value": "(B) (0.200, 0.503)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/98bb27d9d60e6155.jpg", "conversations": [ { "from": "human", "value": "\nDoes shiny dark green car at right have a larger size compared to green plastic goggles at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, shiny dark green car at right is bigger than green plastic goggles at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f0e6a198a8c0aff.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) matte plastic monitor at center (B) white plastic machine at center" }, { "from": "gpt", "value": "(B) white plastic machine at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ac8dd214e2a62066.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the blonde hair at center? (A) black leather jacket at left (B) black leather jacket at center (C) smooth brown hair at center (D) blue denim jacket at upper right" }, { "from": "gpt", "value": "(C) smooth brown hair at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c02b5cb00e836a4a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.306, 0.567) (B) (0.784, 0.694) (C) (0.661, 0.812)" }, { "from": "gpt", "value": "(C) (0.661, 0.812)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c0b23cd5da08e10b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if silky blue fabric dress at center is smaller than matte gold head at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, silky blue fabric dress at center might be larger than matte gold head at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d5b4be57e5db0703.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.664, 0.948) (B) (0.540, 0.611)" }, { "from": "gpt", "value": "(B) (0.540, 0.611)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2fc7cf36dafa6cb9.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of white suede sneaker at center in reference to white canvas shoe at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a563926cf1f34052.jpg", "conversations": [ { "from": "human", "value": "\nIs multicolored denim shorts at center to the left of white paper sign at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, multicolored denim shorts at center is not to the left of white paper sign at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d718abbdd06c704.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.669, 0.353) (B) (0.331, 0.334)" }, { "from": "gpt", "value": "(B) (0.331, 0.334)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5debfb98575f7bf5.jpg", "conversations": [ { "from": "human", "value": "\nDoes green grass at center appear on the left side of metallic glass cable car at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, green grass at center is not on the left side of metallic glass cable car at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b44798b575b1df42.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny black van at lower left below light blue denim shorts at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1099c5b8c8570aab.jpg", "conversations": [ { "from": "human", "value": "\nIs bronze statue at center thinner than greenish-blue water at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, bronze statue at center has a lesser width compared to greenish-blue water at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/523d5e0f70892b67.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.877, 0.755) (B) (0.654, 0.356)" }, { "from": "gpt", "value": "(A) (0.877, 0.755)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ec31d8901be59a4.jpg", "conversations": [ { "from": "human", "value": "\nDoes white stone church at center lie in front of white stone church at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is in front of white stone church at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5be63954b447b80a.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the matte green shirt at left from the following options: (A) yellow matte table at center (B) light beige fabric shirt at center (C) khaki pants at center?" }, { "from": "gpt", "value": "(A) yellow matte table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/99887ed938e44e9b.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.615, 0.719) (B) (0.817, 0.722) (C) (0.606, 0.333)" }, { "from": "gpt", "value": "(B) (0.817, 0.722)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78266e6efab269ad.jpg", "conversations": [ { "from": "human", "value": "\nDoes glossy glass tower at center appear on the right side of transparent glass tower at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, glossy glass tower at center is to the right of transparent glass tower at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3f1a65bfcfb9ae4e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.567, 0.467) (B) (0.436, 0.350)" }, { "from": "gpt", "value": "(B) (0.436, 0.350)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f6ad48c80701a70.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the clear plastic glasses at center? (A) black plastic tablet at center (B) wooden table at center (C) rainbow knitted hat at center" }, { "from": "gpt", "value": "(B) wooden table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b195e88931875276.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the black plastic phone at upper center? Choose from: (A) gray bark tree at left (B) striped wool scarf at center (C) silver metallic car at center" }, { "from": "gpt", "value": "(B) striped wool scarf at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b86640aebeaceba.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) matte black jersey at center (B) black matte cycling jersey at left (C) yellow matte bicycle handlebar at center" }, { "from": "gpt", "value": "(A) matte black jersey at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b9ecedf1ad65ec2.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.322, 0.655) (B) (0.864, 0.820) (C) (0.147, 0.225)" }, { "from": "gpt", "value": "(C) (0.147, 0.225)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/62881548dc295df6.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte green uniform at center appear on the right side of metallic wristwatch at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, matte green uniform at center is not to the right of metallic wristwatch at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b63832c434028a5.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green lego dragon at center is positioned to the right of white water at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, green lego dragon at center is not to the right of white water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/032f01960ad7eda1.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the smooth blonde hair at upper right? (A) black matte shirt at center (B) black matte boy at left" }, { "from": "gpt", "value": "(B) black matte boy at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f62647ae4b95b21.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of camouflage fabric table at center and camouflage uniform at center in the image provided, where is camouflage fabric table at center located with respect to camouflage uniform at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c380a6d1888c780.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.823, 0.181) (B) (0.444, 0.325)" }, { "from": "gpt", "value": "(B) (0.444, 0.325)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5714e3f6ffe2aa9b.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.986, 0.853) (B) (0.258, 0.880) (C) (0.921, 0.522)" }, { "from": "gpt", "value": "(B) (0.258, 0.880)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e343d50f4e47102.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) orange fabric jacket at center (B) black leather jacket at center" }, { "from": "gpt", "value": "(A) orange fabric jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6bb2ba201e6cd8f9.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the shiny black bicycle at center among (A) smooth concrete pavement at lower center (B) matte purple shirt at center?" }, { "from": "gpt", "value": "(A) smooth concrete pavement at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8e2c45d660b4278.jpg", "conversations": [ { "from": "human", "value": "\nIs white shirt at center below blue dotted tie at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, white shirt at center is positioned under blue dotted tie at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d821ea7480386058.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of brown fur coat at center and fuzzy gray fur coat at center in the image provided, where is brown fur coat at center located with respect to fuzzy gray fur coat at center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/001b0625a1435b14.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black satin pants at center is positioned to the left of white matte refrigerator at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, black satin pants at center is to the right of white matte refrigerator at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ee59d5e989512597.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.911, 0.917) (B) (0.375, 0.444) (C) (0.205, 0.670)" }, { "from": "gpt", "value": "(A) (0.911, 0.917)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/486621682ab46278.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) white matte shirt at center (B) dark blue suit at left (C) dark brown leather jacket at right" }, { "from": "gpt", "value": "(B) dark blue suit at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/084c13ca5e890006.jpg", "conversations": [ { "from": "human", "value": "\nIs green mossy tree at center below green mossy rock at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5637d94f795e824b.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) shiny black hair at upper right (B) white cotton shirt at left" }, { "from": "gpt", "value": "(A) shiny black hair at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4f66922bc910f6d.jpg", "conversations": [ { "from": "human", "value": "\nDoes black velvet hat at upper right have a smaller size compared to matte black suit at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, black velvet hat at upper right is not smaller in size than matte black suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/950d2f491e59d9ed.jpg", "conversations": [ { "from": "human", "value": "\nIs silhouette man at center positioned behind matte black monitor at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb45ac415aeb5d69.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) white paper bag at center (B) black fabric jacket at center (C) white checkered box at center (D) white matte laptop at center" }, { "from": "gpt", "value": "(A) white paper bag at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/039dd0ed14106d32.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.900, 0.106) (B) (0.100, 0.773)" }, { "from": "gpt", "value": "(B) (0.100, 0.773)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/62cb47db7fa1e6c0.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.522, 0.755) (B) (0.410, 0.425)" }, { "from": "gpt", "value": "(A) (0.522, 0.755)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/652426a75c174b99.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the black polished metal streetlight at center? Select from: (A) metallic pole at center (B) reflective water at lower center" }, { "from": "gpt", "value": "(A) metallic pole at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d971bf1aabd9fed3.jpg", "conversations": [ { "from": "human", "value": "\nIs white snow-covered mountain range at center bigger than smooth gray tree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, white snow-covered mountain range at center is bigger than smooth gray tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dfc279ea34835f55.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) white matte/scratch-free whiteboard at upper right (B) matte plastic table at lower center" }, { "from": "gpt", "value": "(A) white matte/scratch-free whiteboard at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b7d5a51201ae86f.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) white plastic license plate at center (B) matte black trash can at lower left" }, { "from": "gpt", "value": "(B) matte black trash can at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e1e0a5d39fb1119.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow matte bobfloat at lower left in front of dark water at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is in front of dark water at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b18808f817a582e9.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) green inflatable boat at lower center (B) golden matte dog at lower left" }, { "from": "gpt", "value": "(A) green inflatable boat at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bea4ec1e19f8ec64.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gold quilted dress at upper right is bigger than green cotton shorts at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd77b2161ba9a82e.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.125, 0.980) (B) (0.574, 0.959) (C) (0.068, 0.992) (D) (0.214, 0.553)" }, { "from": "gpt", "value": "(D) (0.214, 0.553)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2bb95f86f5c14d9c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the white matte sedan at center-right? Select from: (A) yellow matte barricade at center (B) orange plastic barricades at center" }, { "from": "gpt", "value": "(A) yellow matte barricade at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/55a2e7ec87835048.jpg", "conversations": [ { "from": "human", "value": "\nIs matte pink shirt at center below white matte shirt at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, matte pink shirt at center is above white matte shirt at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d7a89e438cd9f89.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.911, 0.544) (B) (0.039, 0.847)" }, { "from": "gpt", "value": "(B) (0.039, 0.847)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b72b8075439d0f63.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.457, 0.061) (B) (0.780, 0.905) (C) (0.673, 0.927)" }, { "from": "gpt", "value": "(C) (0.673, 0.927)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/75ebcce29e4a1aa0.jpg", "conversations": [ { "from": "human", "value": "\nDoes gold wrought iron fence at center appear over white stone building at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, gold wrought iron fence at center is below white stone building at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e7f201a85809a90.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the green leafy tree at upper left? Choose from: (A) red plastic triangle at upper right (B) red plastic triangle at right" }, { "from": "gpt", "value": "(B) red plastic triangle at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc620ccdf2a4346e.jpg", "conversations": [ { "from": "human", "value": "\nIs light blue denim shorts at center in front of brown leather bag at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is in front of brown leather bag at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/13f4c2533a072030.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) dark gray fabric pants at lower right (B) yellow matte bicycle at center (C) matte black shirt at center (D) shiny silver bicycle at center" }, { "from": "gpt", "value": "(A) dark gray fabric pants at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/125082ca4f529174.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the brown leafless tree at upper left from the following options: (A) green leafy tree at upper left (B) bare branches at center?" }, { "from": "gpt", "value": "(A) green leafy tree at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b950679a9645533d.jpg", "conversations": [ { "from": "human", "value": "\nIs gray rock formation at center to the left of dark gray fleece jacket at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find gray rock formation at center to the left of dark gray fleece jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/18fb1aff9a3ee01b.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) metallic grid tower at left (B) metallic grid tower at center (C) smooth sand at lower center (D) cloudy sky at upper center" }, { "from": "gpt", "value": "(C) smooth sand at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2bab97b7da68c07d.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black jacket at lower right smaller than matte black laptop at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, matte black jacket at lower right has a smaller size compared to matte black laptop at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d03e9b60c049efc.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) matte black harnesses at center (B) orange metallic tower at left (C) yellow plastic swing at center" }, { "from": "gpt", "value": "(C) yellow plastic swing at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f2c9800ce9b3eea.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white cotton shirt at lower left is positioned to the right of matte black shirt at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, white cotton shirt at lower left is positioned on the right side of matte black shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d796566cbf17be3e.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the orange fabric cat bed at center? Choose from: (A) orange fabric bean bag at center (B) black fur cat at center (C) yellow fabric curtain at right (D) black matte cat at center" }, { "from": "gpt", "value": "(C) yellow fabric curtain at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/172fb0d0e63685e2.jpg", "conversations": [ { "from": "human", "value": "\nDoes purple fabric shirt at upper center appear on the left side of yellow translucent juice at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, purple fabric shirt at upper center is to the right of yellow translucent juice at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05b7c3387a3542da.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the black and white striped zebra at lower right? (A) black and white striped zebra nose at lower right (B) black and white striped zebra at left" }, { "from": "gpt", "value": "(A) black and white striped zebra nose at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1cbcff3ace6192a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if clear water at lower left is smaller than green leafy tree at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, clear water at lower left is not smaller in size than green leafy tree at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bae087c6e6f63b14.jpg", "conversations": [ { "from": "human", "value": "\nIs black fabric umpire at center closer to camera compared to white matte uniform at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, black fabric umpire at center is in front of white matte uniform at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c85e89da059cde46.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) silver metallic laptop at center (B) silver metallic case at center (C) wooden table at center" }, { "from": "gpt", "value": "(C) wooden table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8849010d7bfa45d9.jpg", "conversations": [ { "from": "human", "value": "\nIs blue fleece jacket at right wider than pink matte leggings at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of blue fleece jacket at right exceeds that of pink matte leggings at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aed1e9118e3cae5a.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark sand at lower center have a larger size compared to black matte swimsuit at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dbf4a4c8563f6cad.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is matte black jacket at right located relative to matte black jacket at upper right? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/11c6a95463380254.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the green floral dress at center among (A) gray cotton t-shirt at center (B) gray stone pavement at lower center?" }, { "from": "gpt", "value": "(A) gray cotton t-shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ffa7c06b5a51c395.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.957, 0.562) (B) (0.496, 0.723) (C) (0.579, 0.653)" }, { "from": "gpt", "value": "(A) (0.957, 0.562)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3751418fec919a8d.jpg", "conversations": [ { "from": "human", "value": "\nDoes white glossy highway at lower right have a greater width compared to yellow matte license plate at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, white glossy highway at lower right has a greater width compared to yellow matte license plate at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7f22625dcaa21b4a.jpg", "conversations": [ { "from": "human", "value": "\nIs brown leather jacket at center closer to camera compared to light beige shirt at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00456cbee2f9c18c.jpg", "conversations": [ { "from": "human", "value": "\nDoes white glass building at upper left appear under glassy reflective skyscraper at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, white glass building at upper left is positioned under glassy reflective skyscraper at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/288af32b921d3ae3.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the silver metallic ladder at right among (A) white matte clock at center (B) white metallic clock at upper center?" }, { "from": "gpt", "value": "(B) white metallic clock at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04d81a573b56029e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the brown stone bell tower at center? Select from: (A) green grass at lower center (B) green leafy tree at lower right" }, { "from": "gpt", "value": "(A) green grass at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/919ce7592a48fa6a.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the yellow rubber excavator at center? Select from: (A) green leafy tree at upper center (B) yellow metallic excavator at left" }, { "from": "gpt", "value": "(B) yellow metallic excavator at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23d0b40c77f1aadc.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at upper right is bigger than green leafy grass at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/90f7f20adcb680df.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the yellow fabric dress at center among (A) white cotton shirt at upper right (B) wooden dock at right?" }, { "from": "gpt", "value": "(B) wooden dock at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c79bdbd8c59cce2.jpg", "conversations": [ { "from": "human", "value": "\nDoes purple fabric slide at lower left come in front of dark brown hair at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, purple fabric slide at lower left is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dcdb541369567d3e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black hoodie at center is positioned below matte pink plastic deer at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, matte black hoodie at center is not positioned below matte pink plastic deer at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e05cdf294d7a59ed.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) denim jacket at lower center (B) dark blue jeans at center (C) dark gray suit at center" }, { "from": "gpt", "value": "(B) dark blue jeans at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/206d4c2238b9e493.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is matte black robe at center located relative to black matte robe at left? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb53c3edbf23ab90.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.501, 0.548) (B) (0.754, 0.422) (C) (0.454, 0.500)" }, { "from": "gpt", "value": "(C) (0.454, 0.500)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9a0817ea8774fc3b.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.531, 0.711) (B) (0.337, 0.720)" }, { "from": "gpt", "value": "(A) (0.531, 0.711)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de36a78f48f01a53.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.055, 0.289) (B) (0.486, 0.803)" }, { "from": "gpt", "value": "(A) (0.055, 0.289)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a3cdac97317f3ab.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) green leafy tree at left (B) gray asphalt at lower left, is positioned farthest from the green leafy palm tree at center?" }, { "from": "gpt", "value": "(A) green leafy tree at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2a4fe24abac70d1f.jpg", "conversations": [ { "from": "human", "value": "\nDoes light brown wood at center appear under gray plastic monitor at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, light brown wood at center is below gray plastic monitor at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d88340fe3ee388bb.jpg", "conversations": [ { "from": "human", "value": "\nDoes wooden staircase at center lie in front of wooden slats at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b2923986045f305.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the black matte shorts at center? Choose among these: (A) matte black smartphone at center (B) black cotton dress at center (C) blonde hair at center" }, { "from": "gpt", "value": "(A) matte black smartphone at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/81f8e2f325ceb015.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) white fluffy snow at center (B) light brown fur at center (C) fuzzy white dog at center" }, { "from": "gpt", "value": "(C) fuzzy white dog at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3238d3f4926c118d.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.358, 0.511) (B) (0.942, 0.163)" }, { "from": "gpt", "value": "(B) (0.942, 0.163)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/33bd0cca55eaeb50.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) blue fabric jumpsuit at center (B) silver metallic ladder at center" }, { "from": "gpt", "value": "(A) blue fabric jumpsuit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7323ad219b3e3b1e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.242, 0.527) (B) (0.171, 0.439) (C) (0.053, 0.536)" }, { "from": "gpt", "value": "(B) (0.171, 0.439)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0739b444b2262da5.jpg", "conversations": [ { "from": "human", "value": "\nDoes black matte jacket at center have a greater width compared to wooden table at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, black matte jacket at center is wider than wooden table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/68c0061e4b0dcc80.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of matte black scarf at right in relation to white knit beanie at center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4008fd90dce0f920.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.535, 0.397) (B) (0.353, 0.547) (C) (0.359, 0.425)" }, { "from": "gpt", "value": "(A) (0.535, 0.397)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e64f064624ae8f7.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.949, 0.869) (B) (0.305, 0.853) (C) (0.678, 0.075)" }, { "from": "gpt", "value": "(A) (0.949, 0.869)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/196b28b9deeaba51.jpg", "conversations": [ { "from": "human", "value": "\nDoes terracotta pot at center appear over brown matte pot at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, terracotta pot at center is not positioned above brown matte pot at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a69d0973bd246d0a.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) matte black laptop at center (B) matte brown shirt at left (C) purple silk jacket at center" }, { "from": "gpt", "value": "(B) matte brown shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0deacb130e6b090a.jpg", "conversations": [ { "from": "human", "value": "\nDoes white soft fur goat at center have a lesser width compared to white woolen lamb at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a4236a3f938289e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) blue cotton shirt at right (B) matte brown tie at center (C) tan uniform at center (D) tan uniform at left" }, { "from": "gpt", "value": "(B) matte brown tie at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf2c562674609fcf.jpg", "conversations": [ { "from": "human", "value": "\nIs matte red jersey at left further to the viewer compared to smooth white shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bec9ac5fe1c57e8f.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black jacket at center appear on the right side of dark blue shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, matte black jacket at center is not to the right of dark blue shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/135b2f5b4de57058.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.486, 0.781) (B) (0.107, 0.766)" }, { "from": "gpt", "value": "(B) (0.107, 0.766)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8028aadf4438cdf7.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.559, 0.475) (B) (0.410, 0.345)" }, { "from": "gpt", "value": "(A) (0.559, 0.475)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a35bcb70810c05a.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is smooth bark tree at center located relative to wooden log cabin at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e96fef00d1707bf.jpg", "conversations": [ { "from": "human", "value": "\nIs black leather chair at lower left above beige fabric chair at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b690b4d4285d51d4.jpg", "conversations": [ { "from": "human", "value": "\nWhere is matte black dress at center located in relation to matte black bag at center in the image? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/663af44bb985976d.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.517, 0.578) (B) (0.173, 0.595) (C) (0.067, 0.356)" }, { "from": "gpt", "value": "(A) (0.517, 0.578)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d06ba36f8fb4dedc.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the matte orange helmet at center? Choose among these: (A) matte black construction suit at center (B) matte black jacket at center (C) silver metallic pole at right (D) matte red helmet at center" }, { "from": "gpt", "value": "(C) silver metallic pole at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a045a240c8638901.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) satin metallic car at center (B) matte black jacket at center" }, { "from": "gpt", "value": "(B) matte black jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a132ac7bbb410c16.jpg", "conversations": [ { "from": "human", "value": "\nIs white paper sign at right wider than matte black backpack at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2081353b446de8bc.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the green plastic bin at center? Select from: (A) brown rough bricks at center (B) blue plastic bin at right" }, { "from": "gpt", "value": "(B) blue plastic bin at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1dec08ce362a6140.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) green grass at center (B) blue lace dress at lower right" }, { "from": "gpt", "value": "(B) blue lace dress at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2003f753319c4f5a.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) metallic silver microphone at center (B) white matte shirt at lower center" }, { "from": "gpt", "value": "(B) white matte shirt at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3e88f78f398d7ed4.jpg", "conversations": [ { "from": "human", "value": "\nIs gray hoodie at right wider than gray fabric jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, gray hoodie at right's width does not surpass gray fabric jacket at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/91e7ffae57aaea95.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at center smaller than smooth concrete path at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, green leafy tree at center is not smaller than smooth concrete path at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1cc9f05d17818c69.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the matte white blouse at upper center? (A) stone wall at center (B) matte white tank top at center" }, { "from": "gpt", "value": "(B) matte white tank top at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b3ed562eb243cc7c.jpg", "conversations": [ { "from": "human", "value": "\nIs matte red car at center in front of orange plastic picnic table at right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/50a63580123753d5.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of gray gravel at lower left in relation to rusty metal rail at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/447577eed5940799.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black baseball glove at center is positioned to the right of dark green leather glove at right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, matte black baseball glove at center is to the left of dark green leather glove at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f3752146a1222826.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the matte gray suit at center among (A) black fabric chair at left (B) light brown wood table at center (C) black leather chair at center?" }, { "from": "gpt", "value": "(C) black leather chair at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/524d12e91bf012de.jpg", "conversations": [ { "from": "human", "value": "\nDoes striped fabric binoculars at center have a smaller size compared to white painted wood at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, striped fabric binoculars at center is not smaller than white painted wood at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ad405f14b670b83c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if smooth skin hand at center is positioned to the right of matte brown purse at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find smooth skin hand at center to the right of matte brown purse at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/679c69b1f9d111ec.jpg", "conversations": [ { "from": "human", "value": "\nDoes wooden panelled door at right have a larger size compared to denim jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, wooden panelled door at right is larger in size than denim jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b1c966d3c8ba196.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the white tiled tower at upper right? (A) brown textured tower at left (B) brown textured building at left" }, { "from": "gpt", "value": "(A) brown textured tower at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd952930ca7b057e.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark brown stone statue at upper center have a smaller size compared to polished bronze statue at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, dark brown stone statue at upper center might be larger than polished bronze statue at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a40eb59d3560c715.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the blue striped tie at right? Choose among these: (A) maroon textured tie at left (B) dark blue suit at center (C) dark gray pinstripe suit at left" }, { "from": "gpt", "value": "(A) maroon textured tie at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a3283ad6607362b2.jpg", "conversations": [ { "from": "human", "value": "\nDoes sunglasses at left have a smaller size compared to transparent plastic glasses at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, sunglasses at left has a smaller size compared to transparent plastic glasses at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/faaca79f6fc7a6eb.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white cotton shirt at center is smaller than purple cotton shirt at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, white cotton shirt at center is smaller than purple cotton shirt at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9167bc3b729286ee.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) striped fabric shirt at center (B) white fabric beach chair at upper right (C) blue fabric beach chair at center" }, { "from": "gpt", "value": "(C) blue fabric beach chair at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86d4ae50dd198e72.jpg", "conversations": [ { "from": "human", "value": "\nDoes white satin dress at center appear on the left side of black matte dress at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white satin dress at center is not on the left side of black matte dress at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/71f2a303cabe0079.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) white fabric skirt at center (B) metallic washboard at center (C) gray concrete pavement at lower center" }, { "from": "gpt", "value": "(C) gray concrete pavement at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3325687bf67295aa.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) blue glossy train at center (B) blue/white plastic train at center" }, { "from": "gpt", "value": "(A) blue glossy train at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00c874833f92eb06.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.280, 0.403) (B) (0.195, 0.125)" }, { "from": "gpt", "value": "(B) (0.195, 0.125)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/26454d119d7ea269.jpg", "conversations": [ { "from": "human", "value": "\nDoes purple fabric mat at center have a greater width compared to green fabric street artist at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of purple fabric mat at center exceeds that of green fabric street artist at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9365c12555407e9f.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of white marble column at center less distant than that of dark suit at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/81b4856b7d41a090.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray rough rock at left appear on the right side of green matte tree at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, gray rough rock at left is to the left of green matte tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b2a15b6525dfca9.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) striped cotton shirt at center (B) white glossy table at lower left" }, { "from": "gpt", "value": "(B) white glossy table at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aeebad1b6e028e14.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark blue jeans at center have a smaller size compared to brown cotton pants at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, dark blue jeans at center is smaller than brown cotton pants at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/87422eca163df00e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.682, 0.906) (B) (0.244, 0.667)" }, { "from": "gpt", "value": "(A) (0.682, 0.906)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a90d22f3495a3cd5.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) metallic gray bridge at center (B) white matte boat at lower left (C) blue water at lower center" }, { "from": "gpt", "value": "(A) metallic gray bridge at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34959bead13ac12c.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is denim shirt at center located relative to blue denim shirt at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/52ec4c5c42fc80c3.jpg", "conversations": [ { "from": "human", "value": "\nIs gray hoodie at left thinner than blue fabric cap at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, gray hoodie at left might be wider than blue fabric cap at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce70975a28bde105.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) light blue striped sweater at lower right (B) green plastic toy at center (C) rubberized red toy at center" }, { "from": "gpt", "value": "(A) light blue striped sweater at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ad4564a1b66de26.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) yellow printed dress at upper left (B) white floral dress at center (C) yellow printed fabric dress at left (D) multicolored striped paper bag at center" }, { "from": "gpt", "value": "(B) white floral dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dcd6261e8decd871.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.836, 0.727) (B) (0.137, 0.606)" }, { "from": "gpt", "value": "(A) (0.836, 0.727)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f0061c1ec8dd130.jpg", "conversations": [ { "from": "human", "value": "\nDoes gold sequined dress at center appear on the right side of silver/crystal crown at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, gold sequined dress at center is to the left of silver/crystal crown at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dcea41928db67746.jpg", "conversations": [ { "from": "human", "value": "\nDoes gold/black clock at center have a larger size compared to smooth stone spire at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d401c390c1f7b03c.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark blue sweater at center have a lesser width compared to light brown leather jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, dark blue sweater at center is not thinner than light brown leather jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be295a93b3592189.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) smooth yellow bun at center (B) pink foam burger at center" }, { "from": "gpt", "value": "(A) smooth yellow bun at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d8cb2a5b1463d3a3.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.507, 0.777) (B) (0.001, 0.339)" }, { "from": "gpt", "value": "(A) (0.507, 0.777)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ae09c692fdcbcf48.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.544, 0.372) (B) (0.341, 0.908) (C) (0.769, 0.872)" }, { "from": "gpt", "value": "(B) (0.341, 0.908)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/63e842d978dd0198.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the soft plush toy at center from the following options: (A) velvet-like red couch at center (B) white matte table at lower center (C) brown textured sock at center?" }, { "from": "gpt", "value": "(B) white matte table at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0b1a39cea73c337.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) orange reflective vest at center (B) green fabric cap at center (C) blue shirt at lower center" }, { "from": "gpt", "value": "(B) green fabric cap at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e992ce629c48c985.jpg", "conversations": [ { "from": "human", "value": "\nDoes black matte shirt at center lie in front of floral print fabric top at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is in front of floral print fabric top at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58d42ef39d44b7cd.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.195, 0.530) (B) (0.833, 0.797) (C) (0.398, 0.542)" }, { "from": "gpt", "value": "(B) (0.833, 0.797)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b21712baad2cc4fe.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte bicycle at lower right wider than blue glossy sedan at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, black matte bicycle at lower right is not wider than blue glossy sedan at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4a9f7b288295734.jpg", "conversations": [ { "from": "human", "value": "\nDoes white frosty tree at upper right have a greater width compared to green matte tree at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of white frosty tree at upper right exceeds that of green matte tree at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3976e507bb991015.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) brown wooden cabin at center (B) white fluffy snow at center" }, { "from": "gpt", "value": "(B) white fluffy snow at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de13e4c743602109.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the blue striped tie at left among (A) matte paper poster at center (B) black suit at left (C) wire mesh fence at lower left (D) blue plastic sign at upper center?" }, { "from": "gpt", "value": "(D) blue plastic sign at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5963318301830004.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white matte table at center is wider than shiny metallic ball at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, the width of white matte table at center exceeds that of shiny metallic ball at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4cf9b86a398eabd0.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of black matte shirt at left more distant than that of pink matte shirt at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is in front of pink matte shirt at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e2b4a44d770a295.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark blue shirt at center is thinner than matte black sweater at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, dark blue shirt at center is not thinner than matte black sweater at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f68851d2f93089ca.jpg", "conversations": [ { "from": "human", "value": "\nDoes knitted teal sweater at center have a larger size compared to black matte coat at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05a8931f6610ed33.jpg", "conversations": [ { "from": "human", "value": "\nDoes white concrete dock at lower center have a greater width compared to white glossy ferry at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, white concrete dock at lower center has a greater width compared to white glossy ferry at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6441948e3c1398e7.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) wooden canoe at center (B) denim jacket at lower right (C) white cotton shirt at right (D) matte black canoe at center" }, { "from": "gpt", "value": "(D) matte black canoe at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/66d4246cb1d601cc.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the white matte motorcycle at center? (A) matte yellow kain at center (B) matte gold dress at center" }, { "from": "gpt", "value": "(B) matte gold dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/025899d2103bf10a.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) purple matte shirt at lower center (B) white cotton dress at center" }, { "from": "gpt", "value": "(B) white cotton dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc11fd878f352792.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray cotton shirt at center appear on the right side of sandy beach at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find gray cotton shirt at center to the right of sandy beach at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5cf7db31d7fd01a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.191, 0.880) (B) (0.590, 0.616)" }, { "from": "gpt", "value": "(B) (0.590, 0.616)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6297ed4cfab32f3e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white glossy toilet bowl at center is positioned to the right of satin silver sink at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, white glossy toilet bowl at center is not on the right side of satin silver sink at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f9b8773f44f2b03a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.253, 0.755) (B) (0.810, 0.494)" }, { "from": "gpt", "value": "(B) (0.810, 0.494)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/63083f33c5471e31.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of metallic silver bicycle at center in relation to denim jacket at upper left? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/575f2fdb632ea497.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at center have a lesser width compared to wooden cabin at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/043576899b1ab827.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the orange rubber pacifier at center? Choose from: (A) yellow fleece blanket at center (B) orange rubber pacifier at upper left" }, { "from": "gpt", "value": "(A) yellow fleece blanket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/15e771115bba0152.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) blonde hair at lower center (B) maroon fabric shirt at lower center (C) maroon fabric at lower left (D) black matte microphone at center" }, { "from": "gpt", "value": "(A) blonde hair at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a77f776c8c4be868.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark brown wool coat at center is smaller than white cotton t-shirt at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, dark brown wool coat at center is not smaller than white cotton t-shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4c13934561f0dd2.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.687, 0.306) (B) (0.572, 0.780) (C) (0.271, 0.847)" }, { "from": "gpt", "value": "(A) (0.687, 0.306)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd1d57a94d04b5e7.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) matte olive green jacket at center (B) green shiny pine tree at right (C) beige plaid coat at center" }, { "from": "gpt", "value": "(C) beige plaid coat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f805305c42e9c500.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) concrete at center (B) striped fabric at center (C) green matte shirt at center (D) black fabric stroller at lower left" }, { "from": "gpt", "value": "(C) green matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/31e6912d4cb4751a.jpg", "conversations": [ { "from": "human", "value": "\nDoes green matte signboard at center appear over black paper at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9796560164ea9d4f.jpg", "conversations": [ { "from": "human", "value": "\nIs pink gingham dress at center closer to camera compared to white cotton dress at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce33a5e1720f0bf0.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.367, 0.461) (B) (0.764, 0.150)" }, { "from": "gpt", "value": "(A) (0.367, 0.461)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6aba8b9366dabc27.jpg", "conversations": [ { "from": "human", "value": "\nDoes black paper at center lie behind gold metallic bear at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c23625f7114e79b0.jpg", "conversations": [ { "from": "human", "value": "\nDoes satin black suit at center lie in front of blue dotted silk tie at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/573ec16024dbe298.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of green grass at center and brown textured tree at right in the image provided, where is green grass at center located with respect to brown textured tree at right? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/38dca42986095fb3.jpg", "conversations": [ { "from": "human", "value": "\nWhere is black leather jacket at center located in relation to brown wool jacket at lower left in the image? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/79bd97c2e5ab1768.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is shiny black jacket at left located relative to matte beige jacket at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9b665966a6da13f.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the yellow cotton shirt at right? Choose among these: (A) matte blue t-shirt at left (B) blue floral dress at center" }, { "from": "gpt", "value": "(B) blue floral dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2622e5f2f20179fb.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the wooden table at center? (A) white matte shirt at center (B) white fabric shirt at center" }, { "from": "gpt", "value": "(A) white matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f2b8173abc3180a4.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.444, 0.341) (B) (0.851, 0.280)" }, { "from": "gpt", "value": "(B) (0.851, 0.280)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e661690fcc6cb561.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) brown hair at center (B) blue striped tank top at left" }, { "from": "gpt", "value": "(A) brown hair at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b5c3d7a87e5ebef.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the smooth gray rock at center? (A) white sandy beach at center (B) green leafy palm tree at left (C) gray rough rock at center" }, { "from": "gpt", "value": "(A) white sandy beach at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d05b1ead289897e.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the matte black vest at center? (A) matte black helmet at center (B) black plastic gun at center" }, { "from": "gpt", "value": "(A) matte black helmet at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1580f3a8b79a67f5.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.128, 0.503) (B) (0.523, 0.586) (C) (0.675, 0.089)" }, { "from": "gpt", "value": "(A) (0.128, 0.503)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c12bb83e29ab86d7.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at upper right below green leafy tree at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, green leafy tree at upper right is positioned under green leafy tree at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/28dfda071f1193d5.jpg", "conversations": [ { "from": "human", "value": "\nDoes white fabric shirt at left have a lesser width compared to brown wood table at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, white fabric shirt at left's width is less than brown wood table at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4e709a1a74e3d87.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark gray suit at left appear over dark blue silk tie at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/22ea25a2034ffd8a.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.849, 0.950) (B) (0.343, 0.167) (C) (0.833, 0.234) (D) (0.169, 0.886)" }, { "from": "gpt", "value": "(B) (0.343, 0.167)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d358b7f3458638db.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) white smooth dome at lower left (B) white smooth tower at center" }, { "from": "gpt", "value": "(A) white smooth dome at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0983610fa0bf760.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.678, 0.594) (B) (0.617, 0.781) (C) (0.864, 0.244)" }, { "from": "gpt", "value": "(B) (0.617, 0.781)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7f22d17527d7b7c6.jpg", "conversations": [ { "from": "human", "value": "\nIs red wool coat at center positioned behind black leather jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is in front of black leather jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3dc35a386b5d6665.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte house at lower center lie in front of black rock cave at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c2d61f97633d7224.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown wooden bench at center have a smaller size compared to black wood bench at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, brown wooden bench at center is not smaller than black wood bench at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/971f8e9f0d8cc472.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of orange matte book at center more distant than that of wooden bookshelf at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/501bffb948d0fdab.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the golden textured cloud at center? (A) green asphalt road at center (B) green grassy path at lower center (C) golden-yellow cotton cloud at upper left" }, { "from": "gpt", "value": "(C) golden-yellow cotton cloud at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4d1f7ef1ef98c26.jpg", "conversations": [ { "from": "human", "value": "\nDoes red matte jacket at center appear on the left side of white plastic sign at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find red matte jacket at center to the left of white plastic sign at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b477c745555a25bc.jpg", "conversations": [ { "from": "human", "value": "\nIs blue metallic bicycle at right bigger than white satin dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, blue metallic bicycle at right has a larger size compared to white satin dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e7bb1ca1e6ab8415.jpg", "conversations": [ { "from": "human", "value": "\nIs dark gray suit at center thinner than gray matte suit at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, dark gray suit at center might be wider than gray matte suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dfb402f9a46fa153.jpg", "conversations": [ { "from": "human", "value": "\nDoes rusty metal window at upper center lie behind brown stone cherub at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea4d7a2e9d8dcc77.jpg", "conversations": [ { "from": "human", "value": "\nIs gray stone face at center positioned at the back of jeans at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is behind jeans at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/893f5331af04ddfc.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth brown pole at right below smooth brown pole at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, smooth brown pole at right is not positioned below smooth brown pole at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aa2e1c6fc32ea7c3.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.905, 0.752) (B) (0.177, 0.645)" }, { "from": "gpt", "value": "(A) (0.905, 0.752)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/985b5fc605048897.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.673, 0.212) (B) (0.724, 0.705) (C) (0.655, 0.020)" }, { "from": "gpt", "value": "(A) (0.673, 0.212)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc201288a3b84ff9.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) metallic gray car at center (B) stone church at center" }, { "from": "gpt", "value": "(A) metallic gray car at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/40870d22b5fcf04e.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte shirt at center have a greater width compared to red fabric backpack at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white matte shirt at center is not wider than red fabric backpack at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/54ce028d509a7a62.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of metallic car at center in reference to dark gray fabric man at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a76f73d2a4cf5c7.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) green matte tree at center (B) green leafy tree at left (C) smooth gray telegraph pole at center (D) metallic silver car at lower right" }, { "from": "gpt", "value": "(A) green matte tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23e92bf6cf23a89e.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the green grass at center? Choose from: (A) matte gray glove at center (B) dark gray feathers at upper right (C) teal fleece jacket at center" }, { "from": "gpt", "value": "(C) teal fleece jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc0d1feecb53a7a8.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the denim jacket at upper center? Select from: (A) green matte shirt at lower right (B) green matte baseball cap at upper left" }, { "from": "gpt", "value": "(B) green matte baseball cap at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1bbbe4da625a8f9.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the black reflective sunglasses at center? (A) green matte shirt at center (B) brown brick clock tower at center (C) white marble clock at upper center" }, { "from": "gpt", "value": "(A) green matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e719a5b095acd135.jpg", "conversations": [ { "from": "human", "value": "\nDoes silhouette palm tree at left lie in front of silhouette palm tree at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b7032a0020b6c09.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) matte blue statue at center (B) blue matte robe at center" }, { "from": "gpt", "value": "(B) blue matte robe at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d20fc4eaec2b33ec.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.153, 0.922) (B) (0.126, 0.575) (C) (0.576, 0.403)" }, { "from": "gpt", "value": "(C) (0.576, 0.403)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eeb1f3f56a4fa508.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.183, 0.566) (B) (0.421, 0.512) (C) (0.686, 0.400)" }, { "from": "gpt", "value": "(A) (0.183, 0.566)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3eb6ebb12a592468.jpg", "conversations": [ { "from": "human", "value": "\nDoes brick-patterned plastic food truck at center have a lesser width compared to white matte jacket at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/45a7b9af411983d9.jpg", "conversations": [ { "from": "human", "value": "\nIs bare branches at center above metallic wire at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, bare branches at center is not above metallic wire at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3475a35bb76a1d00.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.396, 0.977) (B) (0.550, 0.492) (C) (0.394, 0.723) (D) (0.046, 0.495)" }, { "from": "gpt", "value": "(B) (0.550, 0.492)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0056adb1d454d015.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of white glass door at center in reference to matte white cap at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/09b7830c386a5878.jpg", "conversations": [ { "from": "human", "value": "\nIs gray fabric shirt at upper center thinner than smooth yellow bread at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, gray fabric shirt at upper center might be wider than smooth yellow bread at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1eb5a4dd8f8da05e.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) white fluffy snow at center (B) satin black lamp post at center" }, { "from": "gpt", "value": "(B) satin black lamp post at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/51d08fb083260a00.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) green matte eye at upper left (B) dark brown hair at upper center (C) green matte eye at center, is positioned closest to the brown hair at upper center?" }, { "from": "gpt", "value": "(A) green matte eye at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0276efdbb6da5750.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) matte blue sweater at center (B) dark blue sweater at center (C) light blue fabric baby at center (D) dark blue fabric at left" }, { "from": "gpt", "value": "(A) matte blue sweater at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/91f631672d120443.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) metallic silver bus at center (B) transparent glass train window at center" }, { "from": "gpt", "value": "(A) metallic silver bus at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f0d405e3c7153acb.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if rough stone cave at center is positioned to the right of dark brown leather backpack at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, rough stone cave at center is to the left of dark brown leather backpack at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d8c22e1cc0a2477d.jpg", "conversations": [ { "from": "human", "value": "\nDoes silver glass building at center appear over white stone tower at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, silver glass building at center is not positioned above white stone tower at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9615c85924a2e086.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray rough rock at lower right have a larger size compared to gray rock at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, gray rough rock at lower right is not bigger than gray rock at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e3ffb51704327b3a.jpg", "conversations": [ { "from": "human", "value": "\nIs green grassy field at center to the right of green grassy path at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, green grassy field at center is to the right of green grassy path at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f64d66f357711b7c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.918, 0.833) (B) (0.822, 0.834) (C) (0.132, 0.702)" }, { "from": "gpt", "value": "(A) (0.918, 0.833)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f329047d6adb39a3.jpg", "conversations": [ { "from": "human", "value": "\nDoes dead wood tree at left have a smaller size compared to green leafy bush at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, dead wood tree at left might be larger than green leafy bush at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b529e65fdad116bf.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the white wooden boat at center from the following options: (A) rusty wood boat at center (B) smooth dark blue water at center (C) wooden planks at center (D) wooden boat at center?" }, { "from": "gpt", "value": "(A) rusty wood boat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d5b5e7e02efa3241.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) matte black car at upper left (B) silver metallic hatchback at upper left (C) white matte car at center" }, { "from": "gpt", "value": "(B) silver metallic hatchback at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4d558776dd49b78.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the shiny black sedan at left among (A) dark gray coat at center (B) gray concrete sidewalk at center (C) dark gray fabric jacket at lower right?" }, { "from": "gpt", "value": "(B) gray concrete sidewalk at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b4c3da955ee5cb8.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the white matte house at lower left? (A) wooden cabin at left (B) white corrugated metal hut at center" }, { "from": "gpt", "value": "(B) white corrugated metal hut at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b821ba1aa4bc026.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) black turtleneck sweater at center (B) matte black sweater at center" }, { "from": "gpt", "value": "(B) matte black sweater at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/43ce1bd1c927d623.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at upper center further to camera compared to beige sandy beach at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8b54c971706fb56.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.463, 0.662) (B) (0.797, 0.591) (C) (0.836, 0.811)" }, { "from": "gpt", "value": "(B) (0.797, 0.591)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46c5d45c6e9b7bc3.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) metallic silver shovel at center (B) blue matte shirt at center" }, { "from": "gpt", "value": "(B) blue matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ef372b67b738bd0.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of smooth bark tree at right more distant than that of striped jersey at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dfc170a577ed7319.jpg", "conversations": [ { "from": "human", "value": "\nIs brown textured shirt at center bigger than metallic gray boat at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ed019a351c483ee.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.363, 0.289) (B) (0.147, 0.491) (C) (0.879, 0.452)" }, { "from": "gpt", "value": "(A) (0.363, 0.289)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/925ec40e8e2fe1fd.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white cloth napkin at lower left is smaller than blue surgical mask at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3867bbb09f89214a.jpg", "conversations": [ { "from": "human", "value": "\nIs green soft grass at lower center smaller than green grassy mountain range at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green soft grass at lower center has a smaller size compared to green grassy mountain range at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2a1cb63d7fb75b3e.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) matte black scarf at left (B) white satin dress at center (C) light blue cotton shirt at right" }, { "from": "gpt", "value": "(A) matte black scarf at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7610cfeb82b71018.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte brown pants at center appear over matte orange kayak at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3baf02adaf036b5e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) green matte baseball cap at left (B) polychrome mosaic dragon at center" }, { "from": "gpt", "value": "(A) green matte baseball cap at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6566c14a826aad98.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte shirt at left above translucent plastic game at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, black matte shirt at left is positioned over translucent plastic game at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88bea97db747d2b4.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at upper center smaller than green textured tree at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, green leafy tree at upper center has a smaller size compared to green textured tree at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/89d75721933b9d8b.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) dark blue wool coat at right (B) dark gray suit at left (C) patterned silk tie at center" }, { "from": "gpt", "value": "(B) dark gray suit at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/11e733516e3982e2.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.421, 0.922) (B) (0.090, 0.845) (C) (0.866, 0.736) (D) (0.954, 0.100)" }, { "from": "gpt", "value": "(A) (0.421, 0.922)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf516e9cbeaf06d7.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) rustic stone wall at right (B) green grassy at center (C) dirt path at center" }, { "from": "gpt", "value": "(B) green grassy at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7690d258aaa7f5d.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) plaid cotton shirt at center (B) black matte shirt at center (C) white t-shirt at center" }, { "from": "gpt", "value": "(B) black matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ae32eda7d4bb5796.jpg", "conversations": [ { "from": "human", "value": "\nIs matte gray climbing harness at center smaller than green nylon rope at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, matte gray climbing harness at center is not smaller than green nylon rope at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e574bf42a88dab29.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.909, 0.545) (B) (0.220, 0.275)" }, { "from": "gpt", "value": "(B) (0.220, 0.275)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0f3da7d358565b7.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.900, 0.859) (B) (0.980, 0.938)" }, { "from": "gpt", "value": "(A) (0.900, 0.859)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f992dc46c8efedaa.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) shiny chrome bicycle at center (B) smooth skin face at upper center (C) teal fabric dress at center (D) matte blue banner at upper center, is positioned closest to the blue plaid shorts at right?" }, { "from": "gpt", "value": "(B) smooth skin face at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6eeae4709bd07ff3.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if orange satin skirt at center is positioned above matte plastic doll at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, orange satin skirt at center is below matte plastic doll at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c1ad2e1f3bb072ab.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) black liquid water at center (B) blue matte uniform at center" }, { "from": "gpt", "value": "(B) blue matte uniform at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e6b6f57cf2f76083.jpg", "conversations": [ { "from": "human", "value": "\nIs rusty brown rock at right smaller than yellow lustrous tree at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, rusty brown rock at right has a smaller size compared to yellow lustrous tree at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/739758281f3da75e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if granite eagle at center is positioned above polished bronze statue at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, granite eagle at center is positioned over polished bronze statue at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf93f82c7681e667.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the shiny silver fish at upper left from the following options: (A) dark brown textured fish at lower right (B) white coral at center?" }, { "from": "gpt", "value": "(B) white coral at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9396e77eb1381d0e.jpg", "conversations": [ { "from": "human", "value": "\nIs blue down jacket at center wider than dark green jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, blue down jacket at center has a greater width compared to dark green jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a6fb78e2404210f.jpg", "conversations": [ { "from": "human", "value": "\nDoes green matte t-shirt at left have a greater width compared to black zip-up hoodie at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green matte t-shirt at left has a greater width compared to black zip-up hoodie at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/67046e4b155fdc4e.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) satin black monitor at upper right (B) matte black monitor at left" }, { "from": "gpt", "value": "(B) matte black monitor at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/752377dc3b463bb7.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.615, 0.744) (B) (0.558, 0.475) (C) (0.112, 0.812)" }, { "from": "gpt", "value": "(B) (0.558, 0.475)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b5fd5d6f6bb8c90.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) white silk kimono at center (B) yellow fabric curtain at upper center" }, { "from": "gpt", "value": "(A) white silk kimono at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf638ec72983c289.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the brown dirt field at center from the following options: (A) white plastic fence at left (B) brown wooden fence at center?" }, { "from": "gpt", "value": "(B) brown wooden fence at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b17925b9184e864.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.254, 0.697) (B) (0.499, 0.561) (C) (0.823, 0.480)" }, { "from": "gpt", "value": "(B) (0.499, 0.561)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b172c34a2f58e8d4.jpg", "conversations": [ { "from": "human", "value": "\nIs matte blue shirt at center bigger than blood-stained fabric mask at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, matte blue shirt at center has a larger size compared to blood-stained fabric mask at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/caf2305ea680fe14.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark blue pinstripe suit at center have a lesser width compared to green fabric flag at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2a35dbb19d774e04.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the red striped tie at left? Choose from: (A) light gray silk tie at center (B) matte black suit at left (C) matte black suit at center (D) black matte blazer at center" }, { "from": "gpt", "value": "(B) matte black suit at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba2fba9c28ed5550.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black mask at center is thinner than matte black umbrella at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, matte black mask at center might be wider than matte black umbrella at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/72b9f2d4533e2f5a.jpg", "conversations": [ { "from": "human", "value": "\nDoes white cotton shirt at center have a larger size compared to matte black helmet at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, white cotton shirt at center is larger in size than matte black helmet at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e1b19be3ad33f23.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black sweater at center further to the viewer compared to purple fleece jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f8bbed30993664d.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte pumpkin at center to the left of white matte pumpkin at upper center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, white matte pumpkin at center is to the left of white matte pumpkin at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a8085e04800d555.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) silver metallic spire at upper center (B) bare branches at right" }, { "from": "gpt", "value": "(A) silver metallic spire at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ebff7946a0990be5.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) silver metallic laptop at center (B) blue fabric shirt at center (C) silver/black keyboard at center" }, { "from": "gpt", "value": "(C) silver/black keyboard at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd39217b71f6d1e2.jpg", "conversations": [ { "from": "human", "value": "\nDoes translucent plastic water bottle at center appear under black plastic microphone at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, translucent plastic water bottle at center is below black plastic microphone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/15e71b34556f1853.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.299, 0.608) (B) (0.157, 0.741) (C) (0.019, 0.797) (D) (0.796, 0.219)" }, { "from": "gpt", "value": "(C) (0.019, 0.797)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d0612954856c415.jpg", "conversations": [ { "from": "human", "value": "\nIs dirtloose soildirt field at center bigger than white marble cross at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d53df60bf8faff4f.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if fuzzy black dress at center is positioned below glittery tights at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, fuzzy black dress at center is above glittery tights at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/30cf16fe1acfb67d.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of shiny gold drum at center in relation to maroon silk robe at center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe63fe2988525e95.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) gray asphalt tarmac at center (B) white matte airplane at center" }, { "from": "gpt", "value": "(A) gray asphalt tarmac at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/291deb63a28de0f8.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the gray fabric shirt at center? Select from: (A) purple cotton shirt at center (B) white cotton shirt at right (C) gray matte t-shirt at lower left (D) matte black sunglasses at lower left" }, { "from": "gpt", "value": "(A) purple cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b8933210d6f98c88.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of dark gray coat at center in relation to dark blue jeans at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7292ee8a4ef1f614.jpg", "conversations": [ { "from": "human", "value": "\nIs matte orange life vest at center smaller than red life jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, matte orange life vest at center might be larger than red life jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4cc78efd5f077099.jpg", "conversations": [ { "from": "human", "value": "\nWhere is blue striped polo shirt at left located in relation to plaid fabric shirt at center in the image? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e4b00c01d58e79e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) navy blue polka dot fabric dress at left (B) black matte shirt at center" }, { "from": "gpt", "value": "(A) navy blue polka dot fabric dress at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/56bb782c4e9986b7.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) shiny black car at right (B) silver metallic car at center" }, { "from": "gpt", "value": "(A) shiny black car at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5581b51fb619026.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue textured tie at center is thinner than teal satin dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, blue textured tie at center is thinner than teal satin dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e835d87f324bdd63.jpg", "conversations": [ { "from": "human", "value": "\nIs matte red fabric at center closer to the viewer compared to golden silk saree at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, matte red fabric at center is behind golden silk saree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d4f0a7591fbce95.jpg", "conversations": [ { "from": "human", "value": "\nDoes white plastic window at center have a greater width compared to transparent plastic window at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, white plastic window at center has a greater width compared to transparent plastic window at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00dd8db7c96692f1.jpg", "conversations": [ { "from": "human", "value": "\nIs brown textured buildings at center to the right of greenish water at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, brown textured buildings at center is not to the right of greenish water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23781687dec0cf64.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the rustic metal drilling rig at center? (A) metallic silver truck at center (B) rusty metal drilling rig at center (C) dusty red soil at center" }, { "from": "gpt", "value": "(A) metallic silver truck at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b5652c20e3eac5a.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) yellow matte shirt at right (B) matte pink lace dress at center" }, { "from": "gpt", "value": "(A) yellow matte shirt at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b793d961da49386.jpg", "conversations": [ { "from": "human", "value": "\nDoes metal mesh fence at upper center lie in front of spotted fur cheetah at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a60d3a3127634a27.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the green mossy algae at lower center? Choose among these: (A) yellow matte water taxi at center (B) blue matte jacket at center (C) blue fabric backpack at center (D) black matte backpack at center" }, { "from": "gpt", "value": "(D) black matte backpack at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e5055f7dc6a8d108.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.699, 0.545) (B) (0.293, 0.755) (C) (0.194, 0.727)" }, { "from": "gpt", "value": "(A) (0.699, 0.545)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df0eef2184da4b8a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.476, 0.809) (B) (0.583, 0.448) (C) (0.403, 0.967)" }, { "from": "gpt", "value": "(B) (0.583, 0.448)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7d98da37fa0231e3.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) gray matte shirt at center (B) matte pink t-shirt at center" }, { "from": "gpt", "value": "(A) gray matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0ff26b3079682fe.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) camouflage uniform at center (B) camouflage fabric uniform at right" }, { "from": "gpt", "value": "(A) camouflage uniform at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b1d7dd1c4ffca3b.jpg", "conversations": [ { "from": "human", "value": "\nIs red leather couch at center thinner than white leather jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c23132ffe08b58db.jpg", "conversations": [ { "from": "human", "value": "\nDoes red-orange sweater at center come behind shiny metallic bicycle at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36591e48ae247d66.jpg", "conversations": [ { "from": "human", "value": "\nIs white fabric dress at left above white matte jacket at right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white fabric dress at left is not positioned above white matte jacket at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/702541776326853e.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black hoodie at center have a greater width compared to matte black vest at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, matte black hoodie at center's width does not surpass matte black vest at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/71616cdf96ee2fba.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) matte blue card at lower right (B) blue glossy text at bottom center" }, { "from": "gpt", "value": "(B) blue glossy text at bottom center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7d20eb27256a8baa.jpg", "conversations": [ { "from": "human", "value": "\nIs green checkered shirt at center below matte black suit at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, green checkered shirt at center is below matte black suit at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1687223dbb6bb83e.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) green matte dress at left (B) matte black suit at left (C) blue silk tie at center" }, { "from": "gpt", "value": "(A) green matte dress at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b42a811094d80506.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the light brown leather jacket at center among (A) pink fabric person at center (B) dark gray fabric jacket at center (C) red leather jacket at center (D) green wooden temple at center?" }, { "from": "gpt", "value": "(D) green wooden temple at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/79937d719b727d60.jpg", "conversations": [ { "from": "human", "value": "\nIs blue fabric baby carriage at center wider than black fabric jacket at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/45b04906c1eabca5.jpg", "conversations": [ { "from": "human", "value": "\nDoes transparent glass pool at center appear under green grassy bush at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, transparent glass pool at center is below green grassy bush at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/63808b9cf002eaa5.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is gray striped shirt at center located relative to blue textured sweater at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e1005b0090daf894.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the matte black cap at center? Select from: (A) matte black cap at upper center (B) gray striped shirt at center" }, { "from": "gpt", "value": "(B) gray striped shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2bedfa19202081d1.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy palm tree at left is positioned above green leafy palm tree at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, green leafy palm tree at left is above green leafy palm tree at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7603230f080ce37.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if camouflage tank top at right is positioned to the right of purple fabric shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, camouflage tank top at right is positioned on the right side of purple fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7245c65a345cf1e.jpg", "conversations": [ { "from": "human", "value": "\nIs brown wooden rail at center bigger than dark brown wooden boat at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, brown wooden rail at center is larger in size than dark brown wooden boat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8b68e04bc64fe48.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.203, 0.887) (B) (0.493, 0.955) (C) (0.735, 0.825)" }, { "from": "gpt", "value": "(A) (0.203, 0.887)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82ca7a3bb5cd09e1.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if red matte ear protection at upper left is wider than camouflage fabric uniform at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, red matte ear protection at upper left might be narrower than camouflage fabric uniform at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d436479098872438.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) matte black train at center (B) shiny silver train at center (C) red matte freight train at center" }, { "from": "gpt", "value": "(B) shiny silver train at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e4783b4e8439ed86.jpg", "conversations": [ { "from": "human", "value": "\nIs black cast iron frying pan at center further to the viewer compared to brown crusty bread at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5bd98ba0763714f7.jpg", "conversations": [ { "from": "human", "value": "\nIs black and tan fur at center to the right of black leather harness at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, black and tan fur at center is to the right of black leather harness at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7da4cd8cdf372a7.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black vest at center smaller than blue denim skirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, matte black vest at center might be larger than blue denim skirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d93f7de3501274ac.jpg", "conversations": [ { "from": "human", "value": "\nIs bronze statue at center positioned before matte black cane at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d882594140c1f23c.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is camo fabric backpack at center located relative to camo fabric backpack at left? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/423dd6bc50f7234b.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the metallic gray crane at center among (A) blue metallic crane at center (B) metallic blue crane at upper left (C) dark wood dock at lower right?" }, { "from": "gpt", "value": "(A) blue metallic crane at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/94aee240f3e198e1.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black van at left to the right of matte gray minivan at right from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, matte black van at left is not on the right side of matte gray minivan at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/070a72b7141b80c6.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the white shirt at center? Select from: (A) light blue fabric baby at center (B) green artificial turf at center" }, { "from": "gpt", "value": "(A) light blue fabric baby at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9a10fcfcc7d4e73.jpg", "conversations": [ { "from": "human", "value": "\nIs green matte tree at center bigger than brown wooden fence at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, green matte tree at center is bigger than brown wooden fence at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3875fd45d52f30fd.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the brown rough stone at center? (A) green rough stone at center (B) transparent wooden door at upper center" }, { "from": "gpt", "value": "(A) green rough stone at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c34d5f5d5d5fead2.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.142, 0.188) (B) (0.556, 0.469) (C) (0.233, 0.216)" }, { "from": "gpt", "value": "(C) (0.233, 0.216)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a40d8f5549504724.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) brown wicker chair at upper left (B) brown plastic table at center" }, { "from": "gpt", "value": "(A) brown wicker chair at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c49fa4fffa40587b.jpg", "conversations": [ { "from": "human", "value": "\nIs red rubber track at lower center closer to the viewer compared to purple cotton shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/21b67c443021a195.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of golden fur dog at lower left and golden fur dog at upper center in the image provided, where is golden fur dog at lower left located with respect to golden fur dog at upper center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/14a0d9d1f026d2a3.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.578, 0.436) (B) (0.980, 0.967)" }, { "from": "gpt", "value": "(B) (0.980, 0.967)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1168a4f41d81d794.jpg", "conversations": [ { "from": "human", "value": "\nIs white smooth shirt at upper center above white matte fabric at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, white smooth shirt at upper center is not above white matte fabric at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c50f811554f4d2bb.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the blonde hair at center? (A) matte black saxophone at left (B) green matte poster at center (C) matte black jacket at center (D) translucent glass portrait at right" }, { "from": "gpt", "value": "(A) matte black saxophone at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e7065bc63c664a7d.jpg", "conversations": [ { "from": "human", "value": "\nWhere is silver metallic sedan at lower left located in relation to metallic silver sedan at center in the image? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/75234c8f1d8e75a3.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black backpack at center have a lesser width compared to matte black backpack at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte black backpack at center is thinner than matte black backpack at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a024586ce7b81964.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark brown wooden table at center have a greater width compared to velvet-like red figure at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, dark brown wooden table at center is wider than velvet-like red figure at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4cf002adfc61f047.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) white plastic laptop at upper right (B) white fluffy teddy bear at upper left (C) silver metallic recorder at lower left" }, { "from": "gpt", "value": "(B) white fluffy teddy bear at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a9ae7cd1f0b55cdd.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte red shirt at upper left have a greater width compared to satin silver car at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, matte red shirt at upper left is not wider than satin silver car at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b8b10cc69fbebee.jpg", "conversations": [ { "from": "human", "value": "\nDoes transparent water at center have a larger size compared to green matte tree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, transparent water at center is not larger than green matte tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/55b2d6c380071587.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.222, 0.994) (B) (0.767, 0.487) (C) (0.936, 0.672) (D) (0.509, 0.750)" }, { "from": "gpt", "value": "(B) (0.767, 0.487)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/61f56e4fcc7e78fe.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) black matte shirt at center (B) gray water at upper center" }, { "from": "gpt", "value": "(B) gray water at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f07cc8c86d928b7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if turquoise beaded necklace at center is smaller than leather jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, turquoise beaded necklace at center is smaller than leather jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a5a4d88e558f2e8.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny metallic river at center to the right of white frothy water at left from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, shiny metallic river at center is to the right of white frothy water at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a9f6e686c6796562.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.695, 0.642) (B) (0.445, 0.820) (C) (0.398, 0.405)" }, { "from": "gpt", "value": "(C) (0.398, 0.405)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/32a56300eea607f5.jpg", "conversations": [ { "from": "human", "value": "\nIs matte gray tank top at center further to the viewer compared to white cotton shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8ea50bb2da07a5af.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) wooden frame bicycle at center (B) matte black bicycle at left" }, { "from": "gpt", "value": "(B) matte black bicycle at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a6a35e521de3790a.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the sparkly gray sweater at center? (A) smooth white shirt at center (B) black and white fabric flag at center (C) blonde hair at center" }, { "from": "gpt", "value": "(C) blonde hair at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c8e9baa63b09118.jpg", "conversations": [ { "from": "human", "value": "\nDoes black fleece jacket at left have a smaller size compared to black fabric jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, black fleece jacket at left is smaller than black fabric jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e23fa0dcf52f504d.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.495, 0.686) (B) (0.594, 0.880)" }, { "from": "gpt", "value": "(B) (0.594, 0.880)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2097e9d06702a53a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green grassy field at lower center is bigger than wooden barn at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, green grassy field at lower center has a larger size compared to wooden barn at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/030da4f750bf2468.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte green sweater at center is positioned to the right of black matte turtleneck at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find matte green sweater at center to the right of black matte turtleneck at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2cdddd13b1e5e644.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown dry grass at center is thinner than brown dirt track at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, brown dry grass at center is not thinner than brown dirt track at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/68163df12b261f3e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) woven wood armchair at right (B) wooden armchair at center" }, { "from": "gpt", "value": "(B) wooden armchair at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0d80bf03a63850c.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of black smooth shirt at center in relation to wooden sign at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c919547d5ee78736.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at center is smaller than clear water at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, green leafy tree at center is not smaller in size than clear water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb087cfa0fc07571.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark gray shirt at center is positioned to the right of matte brown shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find dark gray shirt at center to the right of matte brown shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d72647de6c30ed66.jpg", "conversations": [ { "from": "human", "value": "\nIs black smooth shirt at right smaller than matte black person at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, black smooth shirt at right is not smaller in size than matte black person at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2dd9d21442491669.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the green leafy branch at upper right? (A) green leafy tree at center (B) stone church at center" }, { "from": "gpt", "value": "(A) green leafy tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3ea64cc4f6bf12f0.jpg", "conversations": [ { "from": "human", "value": "\nIs light brown wooden chair at lower right closer to the viewer compared to wooden chair at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58340d0cccdb3ea8.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) shiny red silk lantern at center (B) dark gray textured tiles at upper center (C) satin red lantern at center" }, { "from": "gpt", "value": "(A) shiny red silk lantern at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/26df1aea7e374f43.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.427, 0.637) (B) (0.020, 0.945) (C) (0.553, 0.823)" }, { "from": "gpt", "value": "(B) (0.020, 0.945)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4c90d672ce2aa10f.jpg", "conversations": [ { "from": "human", "value": "\nDoes metallic blue menorah at upper left appear on the right side of white soft sweater at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, metallic blue menorah at upper left is not to the right of white soft sweater at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8132f518688e4dd4.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) white cotton dress at center (B) shiny silver headdress at upper right (C) matte brown leather moccasins at center (D) multicolored feathered vest at center" }, { "from": "gpt", "value": "(C) matte brown leather moccasins at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/24825cc1f7daf852.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.372, 0.591) (B) (0.237, 0.545)" }, { "from": "gpt", "value": "(B) (0.237, 0.545)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/42e28fae72250c16.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.492, 0.652) (B) (0.570, 0.338) (C) (0.796, 0.508) (D) (0.115, 0.880)" }, { "from": "gpt", "value": "(C) (0.796, 0.508)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3f7498e6b4673519.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) white glossy swan at center (B) gray downy cygnet at center" }, { "from": "gpt", "value": "(A) white glossy swan at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e925ed7343eb2e5f.jpg", "conversations": [ { "from": "human", "value": "\nIs blue fabric canopy at upper left wider than green fabric clown at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6523fc8f8b14d0a3.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden fence at upper center positioned in front of shiny brown turkey at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e09049b6c0a4e057.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.429, 0.589) (B) (0.579, 0.791)" }, { "from": "gpt", "value": "(B) (0.579, 0.791)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c62877c1910cba90.jpg", "conversations": [ { "from": "human", "value": "\nIs rustic wooden building at center thinner than brown wooden fence at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, rustic wooden building at center might be wider than brown wooden fence at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3cffc466255abfd4.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) brown woolen alpaca at right (B) brown fuzzy alpaca at center, is positioned closest to the black glossy alpaca at center?" }, { "from": "gpt", "value": "(B) brown fuzzy alpaca at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/98de1770428e9ce7.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is matte black wheelchair at center located relative to silver metallic car at right? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/795726e4778797ff.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the matte red coat at center? Select from: (A) matte red coat at left (B) watercolor portrait of man with long beard at center (C) matte red vest at center" }, { "from": "gpt", "value": "(B) watercolor portrait of man with long beard at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e64ae149cd0467c7.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.898, 0.631) (B) (0.530, 0.942)" }, { "from": "gpt", "value": "(A) (0.898, 0.631)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff09227c7e5e91dc.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white matte bus at left is smaller than shiny black sedan at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/009c98d4a32ba3c4.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is dark gray fleece at center located relative to black suede boot at lower center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/544b57c858d5ce04.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) matte gray apron at center (B) yellow dough at lower left (C) matte black jacket at upper left, is positioned farthest from the yellow dough at center?" }, { "from": "gpt", "value": "(C) matte black jacket at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e572e237bcae16c5.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green matte canopy at center is positioned to the right of white cotton shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, green matte canopy at center is to the right of white cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/55d02fca2c12a4fe.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.367, 0.647) (B) (0.439, 0.978)" }, { "from": "gpt", "value": "(A) (0.367, 0.647)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0af9f3cff1173b18.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.229, 0.666) (B) (0.617, 0.858)" }, { "from": "gpt", "value": "(B) (0.617, 0.858)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe5a83243b52395a.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte shirt at center to the right of black plastic keyboard at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, black matte shirt at center is not to the right of black plastic keyboard at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b7aa5031d720096.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black backpack at center-left come in front of wire mesh fence at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte black backpack at center-left is in front of wire mesh fence at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4cc2b8535339b089.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.965, 0.792) (B) (0.286, 0.492) (C) (0.503, 0.795)" }, { "from": "gpt", "value": "(B) (0.286, 0.492)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a440b3ec8836f0b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white fleece jacket at left is thinner than black matte jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white fleece jacket at left's width is not less than black matte jacket at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bfc9f12257beaea1.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) pink matte suv at center (B) green spiny cactus at center (C) green leafy bush at center" }, { "from": "gpt", "value": "(A) pink matte suv at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fbcf72478cb694be.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.484, 0.512) (B) (0.345, 0.756) (C) (0.703, 0.745)" }, { "from": "gpt", "value": "(C) (0.703, 0.745)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/25c026285699be6e.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green textured tree at upper left located in relation to green matte tree at upper center in the image? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/434c22b2d2137d34.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of granite rock formation at center in relation to green grassy hill at upper left? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/183472b25989ec52.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) sunglasses at lower left (B) white shirt at center, is positioned closest to the black matte microphone at center?" }, { "from": "gpt", "value": "(A) sunglasses at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab938cf74430e1da.jpg", "conversations": [ { "from": "human", "value": "\nDoes striped sweater at center have a lesser width compared to striped fabric baby at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, striped sweater at center's width is not less than striped fabric baby at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b82c858c5a7da38a.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of blue water at center and white glossy yacht at right in the image provided, where is blue water at center located with respect to white glossy yacht at right? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a10471e7e6280e8.jpg", "conversations": [ { "from": "human", "value": "\nDoes brick gas station at center appear on the left side of black matte truck at center right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find brick gas station at center to the left of black matte truck at center right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f2250154c6365cbb.jpg", "conversations": [ { "from": "human", "value": "\nIs white cotton shirt at center wider than red striped scarf at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of white cotton shirt at center exceeds that of red striped scarf at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d4618dd86add3590.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is floral kimono at center located relative to gray concrete rail at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cfe4908d910dcbcc.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.042, 0.212) (B) (0.095, 0.936)" }, { "from": "gpt", "value": "(A) (0.042, 0.212)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c91eb39a1d12c38c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) woven wood basket at center (B) white crumbly bread at center (C) denim overalls at center" }, { "from": "gpt", "value": "(A) woven wood basket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e01b73bd0a7f56db.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if plaid shirt at left is positioned above metallic silver creamer at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7c042b6d6b7b1b95.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.637, 0.322) (B) (0.520, 0.303) (C) (0.850, 0.470)" }, { "from": "gpt", "value": "(B) (0.520, 0.303)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3fbd137cbac848df.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if denim shirt at left is wider than black matte microphone at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, denim shirt at left has a greater width compared to black matte microphone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/489e7d002969b654.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.630, 0.650) (B) (0.755, 0.467) (C) (0.706, 0.459)" }, { "from": "gpt", "value": "(B) (0.755, 0.467)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df3ee949d68be52d.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the brown wooden telegraph pole at right? Choose among these: (A) green leafy tree at upper left (B) wooden bench at lower center" }, { "from": "gpt", "value": "(B) wooden bench at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/47de549235edb0f0.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the white stone tower at upper left? Select from: (A) yellow-green foliage at center (B) wooden gate at center" }, { "from": "gpt", "value": "(A) yellow-green foliage at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00ec8d6b8da34933.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) dark gray fabric hand at lower right (B) matte black hand at center" }, { "from": "gpt", "value": "(B) matte black hand at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aa89bf40d484cc9a.jpg", "conversations": [ { "from": "human", "value": "\nIs purple tulle dress at left in front of yellow satin dress at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4bb53d30163613fa.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.772, 0.555) (B) (0.836, 0.417) (C) (0.213, 0.964)" }, { "from": "gpt", "value": "(A) (0.772, 0.555)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1619201481b925f9.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.383, 0.613) (B) (0.344, 0.322)" }, { "from": "gpt", "value": "(B) (0.344, 0.322)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/714e6e2f22379304.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of gray sweater at center in relation to purple fleece jacket at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/936ea80951140c8f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.309, 0.344) (B) (0.662, 0.561) (C) (0.140, 0.803)" }, { "from": "gpt", "value": "(A) (0.309, 0.344)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/67505099f6f51d50.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.573, 0.761) (B) (0.681, 0.444) (C) (0.315, 0.231)" }, { "from": "gpt", "value": "(B) (0.681, 0.444)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c8ca30bc04b38825.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if denim jeans at center is positioned below matte blue shirt at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6fb5657b09075bd9.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) iridescent shiny tree at center (B) shiny gold dress at right" }, { "from": "gpt", "value": "(A) iridescent shiny tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/863f28253ad815bc.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the purple cotton t-shirt at left? (A) purple cotton shirt at left (B) camouflage pants at center (C) wooden bookshelf at center" }, { "from": "gpt", "value": "(A) purple cotton shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/904a2c3899f7a30b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if frosted white tree at right is thinner than white frosty tree at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, frosted white tree at right is not thinner than white frosty tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/267ce3cc0ac492ba.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.811, 0.702) (B) (0.170, 0.508) (C) (0.706, 0.520)" }, { "from": "gpt", "value": "(A) (0.811, 0.702)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5f245f7b1984fe3.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.164, 0.948) (B) (0.667, 0.905)" }, { "from": "gpt", "value": "(A) (0.164, 0.948)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7d12e935881c67a2.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black jacket at center is positioned to the right of gray sketch heart at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte black jacket at center is to the right of gray sketch heart at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a0691e52f1cf5641.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the red silk tie at center? (A) wooden picture frame at upper center (B) brown wool coat at lower right (C) blue fabric suit at upper center (D) gray checkered suit at center" }, { "from": "gpt", "value": "(A) wooden picture frame at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8401b0d7d007c88d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.365, 0.808) (B) (0.067, 0.128) (C) (0.002, 0.789)" }, { "from": "gpt", "value": "(C) (0.002, 0.789)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b20ff2d3dd2fe35f.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the silver metallic car at lower left from the following options: (A) yellow-black striped barrier at center (B) white matte suv at lower left?" }, { "from": "gpt", "value": "(A) yellow-black striped barrier at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/068f7b1e6627a34a.jpg", "conversations": [ { "from": "human", "value": "\nDoes pink plastic spoon at mouth appear on the left side of pink rubber spoon at mouth? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, pink plastic spoon at mouth is not to the left of pink rubber spoon at mouth." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e5716ca2c5c3c23e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.341, 0.613) (B) (0.545, 0.408)" }, { "from": "gpt", "value": "(A) (0.341, 0.613)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab7d86f44b01846e.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.741, 0.952) (B) (0.843, 0.433)" }, { "from": "gpt", "value": "(A) (0.741, 0.952)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/17c9747b57932762.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.379, 0.686) (B) (0.259, 0.264)" }, { "from": "gpt", "value": "(B) (0.259, 0.264)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a800731abee5563.jpg", "conversations": [ { "from": "human", "value": "\nIs rusty teal pickup truck at center wider than yellow matte license plate at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, rusty teal pickup truck at center has a greater width compared to yellow matte license plate at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88fbd2f480635c20.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.091, 0.736) (B) (0.233, 0.947)" }, { "from": "gpt", "value": "(B) (0.233, 0.947)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0095bd82ea4131d5.jpg", "conversations": [ { "from": "human", "value": "\nIs brown concrete tower at left below brown textured tower at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, brown concrete tower at left is positioned under brown textured tower at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/22602aa70a8a33f1.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the dark gray sweater at center? Choose from: (A) matte gray sweater at center (B) patterned fabric backpack at center (C) smooth black shirt at right (D) white mesh shoe at upper right" }, { "from": "gpt", "value": "(B) patterned fabric backpack at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e75d48087c96ea9c.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of translucent plastic toothbrush at center in reference to pink translucent toothbrush at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e38cd61a4e50866b.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black shirt at center smaller than black matte hair at right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, matte black shirt at center might be larger than black matte hair at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/889601b4fce02d68.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.864, 0.666) (B) (0.323, 0.570)" }, { "from": "gpt", "value": "(B) (0.323, 0.570)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8791fddd92e56c6c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the white fur dog at center? Choose among these: (A) transparent glass window at upper center (B) white fur at center" }, { "from": "gpt", "value": "(A) transparent glass window at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9acd341f8d77b43.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the shiny blue sedan at lower right? Select from: (A) white matte car at lower center (B) silver metallic sedan at lower left (C) silver metallic car at lower center" }, { "from": "gpt", "value": "(A) white matte car at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/91c1044d78c94333.jpg", "conversations": [ { "from": "human", "value": "\nWhere is black suit at center located in relation to gray matte beard at center in the image? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c56afaeab5ba44e6.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte blue dress at center have a larger size compared to blue fabric dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, matte blue dress at center is larger in size than blue fabric dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/14539d42ea787708.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) white matte shirt at center (B) white matte shirt at upper right (C) striped jersey at center (D) light brown matte nuts at center" }, { "from": "gpt", "value": "(B) white matte shirt at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6616f75ef183ef2e.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of green leafy forest at left and green leafy tree at center in the image provided, where is green leafy forest at left located with respect to green leafy tree at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fa9ac5bdfb832ade.jpg", "conversations": [ { "from": "human", "value": "\nDoes bright blue glossy screen at center have a larger size compared to white plastic entertainment center at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, bright blue glossy screen at center is larger in size than white plastic entertainment center at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b6d49549762166f.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the purple matte shirt at center-left? (A) dark brown leather jacket at center (B) red matte jacket at lower right (C) dark blue jacket at center" }, { "from": "gpt", "value": "(C) dark blue jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1695a0f4ccf31449.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray gravel trail at center appear on the left side of green matte tree at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, gray gravel trail at center is not to the left of green matte tree at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0055fdc49b46352a.jpg", "conversations": [ { "from": "human", "value": "\nDoes green textured tree at center appear on the right side of green leafy tree at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, green textured tree at center is to the left of green leafy tree at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/22cdfc2995ed8a78.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of green grass at lower center and brown fur deer at center in the image provided, where is green grass at lower center located with respect to brown fur deer at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02b1b0ddeac1366d.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of speckled ceramic mug at center and blue textured book at center in the image provided, where is speckled ceramic mug at center located with respect to blue textured book at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d838582e442766a3.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if striped flannel shirt at center is positioned below striped cotton shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, striped flannel shirt at center is below striped cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a591c0b147c016cb.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) clear water at center (B) white glossy boat at lower left (C) green matte canoe at lower right (D) white glossy boat at center" }, { "from": "gpt", "value": "(D) white glossy boat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/17472adc973f002d.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.206, 0.441) (B) (0.694, 0.119) (C) (0.040, 0.527)" }, { "from": "gpt", "value": "(B) (0.694, 0.119)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e5a59ea303b059ec.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white glossy sailboat at center is positioned below wooden dock at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, white glossy sailboat at center is not below wooden dock at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/56de7025fcb9ccd8.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at left come behind dark green leafy tree at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a61512b38c1062e.jpg", "conversations": [ { "from": "human", "value": "\nDoes white cotton shorts at center come behind reddish-brown shorts at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is behind reddish-brown shorts at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c0537f3d0783689.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the orange fabric shirt at center? Choose from: (A) flesh-toned skin at center (B) brick fireplace at center" }, { "from": "gpt", "value": "(B) brick fireplace at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b047b438cd61f5f8.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.488, 0.711) (B) (0.075, 0.784)" }, { "from": "gpt", "value": "(B) (0.075, 0.784)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4d81f6053888720c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) green leafy tree at center (B) brown dirt track at center" }, { "from": "gpt", "value": "(A) green leafy tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1bc7f875dcdaa63.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.868, 0.661) (B) (0.117, 0.767)" }, { "from": "gpt", "value": "(A) (0.868, 0.661)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b3247622f314f95.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at center to the left of brown rough bark tree at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, green leafy tree at center is not on the left side of brown rough bark tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1690b1514e924eb8.jpg", "conversations": [ { "from": "human", "value": "\nIs blue metallic station wagon at center closer to the viewer compared to light brown hair at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d0ee8809ade96de.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the plaid fabric skirt at center? Select from: (A) white matte lab coat at left (B) white matte skirt at center (C) blue plaid skirt at lower center" }, { "from": "gpt", "value": "(C) blue plaid skirt at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/326e06e702070a61.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) pink matte flower pot at lower left (B) shiny black crow at lower center (C) wooden deck at center (D) shiny gray cat at center" }, { "from": "gpt", "value": "(D) shiny gray cat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23d71b9bc57d7d47.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) gray fabric jacket at center (B) white glossy drum at center (C) white drum at center (D) green matte shirt at center" }, { "from": "gpt", "value": "(D) green matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78037d33d95a6544.jpg", "conversations": [ { "from": "human", "value": "\nDoes green grass at lower right have a smaller size compared to blue wooden sign at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, green grass at lower right is not smaller in size than blue wooden sign at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d77329ab560675a9.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.706, 0.594) (B) (0.477, 0.484)" }, { "from": "gpt", "value": "(A) (0.706, 0.594)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ceda54a5733ca0da.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is green grassy field at center located relative to green leafy tree at right? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05e23f0fbdb213ff.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the shiny gold epaulets at left? (A) transparent glass window at center (B) blonde hair at left" }, { "from": "gpt", "value": "(B) blonde hair at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7e42db39794b751.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) red plaid shirt at left (B) pink satin dress at center (C) velvet pink skirt at center, is positioned farthest from the gray woolen robe at center?" }, { "from": "gpt", "value": "(A) red plaid shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aeef05485a9d79c2.jpg", "conversations": [ { "from": "human", "value": "\nDoes orange-brown feathers at center have a larger size compared to shiny red berries at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, orange-brown feathers at center might be smaller than shiny red berries at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/57ad561f578beecb.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black striped sweater at center is thinner than gray zip-up sweater at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e25f75daa56b81e2.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) glossy plastic container at center (B) red glossy pomegranate at upper right (C) yellow matte pear at right (D) red matte apple at upper right" }, { "from": "gpt", "value": "(A) glossy plastic container at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2eb853b134b95e48.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) metallic gray printer at center (B) metallic red hand truck at center" }, { "from": "gpt", "value": "(B) metallic red hand truck at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4f0c47c30fa8366.jpg", "conversations": [ { "from": "human", "value": "\nIs bare branches at left below bare branches at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, bare branches at left is not below bare branches at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5dee40a83057f5be.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte shirt at center below floral fabric shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white matte shirt at center is not positioned below floral fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c361738e1c257db4.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green grassy at center located in relation to fuzzy gray sheep at center in the image? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9029d6b1bd6edb37.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue fabric at center is positioned to the left of black fabric jacket at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find blue fabric at center to the left of black fabric jacket at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a2fbf58352fba88.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.892, 0.452) (B) (0.883, 0.183)" }, { "from": "gpt", "value": "(A) (0.892, 0.452)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c2b4d753a730435.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of metallic wire at upper center in reference to brown wooden telegraph pole at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60cd6b78597077f1.jpg", "conversations": [ { "from": "human", "value": "\nIs quilted fabric flag at center wider than clear water at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, quilted fabric flag at center is not wider than clear water at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c9e617024a507f2e.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the green textured tree at left among (A) green matte tree at center (B) green matte tree at center-right?" }, { "from": "gpt", "value": "(B) green matte tree at center-right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b60aa37dfea29ea.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) matte gold vase at center (B) golden glossy vase at center (C) gold metallic sarcophagus at center" }, { "from": "gpt", "value": "(B) golden glossy vase at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/511fae32ef614308.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of wooden gondola at center and black polished wood gondola at center in the image provided, where is wooden gondola at center located with respect to black polished wood gondola at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de9a6a46b08ac763.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the satin black smartphone at center? (A) matte white smartphone at center (B) black mesh shoe at lower right" }, { "from": "gpt", "value": "(A) matte white smartphone at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a841c56278b84ac.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.537, 0.464) (B) (0.093, 0.330)" }, { "from": "gpt", "value": "(A) (0.537, 0.464)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/544099f056e0a146.jpg", "conversations": [ { "from": "human", "value": "\nIs metallic silver rover at upper right smaller than black matte display at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, metallic silver rover at upper right might be larger than black matte display at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b4f413603f4cbf9.jpg", "conversations": [ { "from": "human", "value": "\nIs black suit at left wider than long brown hair at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, black suit at left has a greater width compared to long brown hair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b33b3bcbea4b723.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.356, 0.316) (B) (0.186, 0.597) (C) (0.581, 0.547) (D) (0.902, 0.586)" }, { "from": "gpt", "value": "(A) (0.356, 0.316)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b9db0d3f9466307.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) glossy plastic dice at center (B) red glossy dice at center (C) black glossy dice at upper center" }, { "from": "gpt", "value": "(C) black glossy dice at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9013090da0b9bd57.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the blue fabric hospital bed at center from the following options: (A) white dotted hospital gown at center (B) metallic blue stethoscope at upper right?" }, { "from": "gpt", "value": "(B) metallic blue stethoscope at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ae3b22c1834bcf61.jpg", "conversations": [ { "from": "human", "value": "\nIs matte purple blouse at center thinner than green plastic chair at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte purple blouse at center is thinner than green plastic chair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c654e92e77bbfc87.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.427, 0.727) (B) (0.525, 0.766) (C) (0.231, 0.423)" }, { "from": "gpt", "value": "(C) (0.231, 0.423)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0dc614979dbd536.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown wooden bench at lower left appear on the right side of brown wooden bench at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, brown wooden bench at lower left is to the left of brown wooden bench at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/45c688eb7d76b3b8.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) brown matte honeycomb at center (B) brown fuzzy bee at center (C) white glove at center" }, { "from": "gpt", "value": "(B) brown fuzzy bee at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ad9b2fa0f8b98085.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) rugged stone mountain at center (B) blue matte cargo ship at center (C) translucent ice at center" }, { "from": "gpt", "value": "(C) translucent ice at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5cefa75e2a8ea95.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.436, 0.561) (B) (0.356, 0.642) (C) (0.375, 0.445)" }, { "from": "gpt", "value": "(C) (0.375, 0.445)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70c9f5de64defe78.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of blue plaid shirt at center and blue striped shirt at center in the image provided, where is blue plaid shirt at center located with respect to blue striped shirt at center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7dda5008fab4eb8.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the smooth plastic fishing pole at center? (A) camouflage fabric jacket at center (B) tan fabric jacket at center" }, { "from": "gpt", "value": "(B) tan fabric jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/466aa556b0ca32da.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of blue plastic recycling bin at center in reference to metallic red car at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ba6fb1587d69786.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) green grass at lower center (B) rusty metal excavator at center" }, { "from": "gpt", "value": "(B) rusty metal excavator at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08451cefd467b176.jpg", "conversations": [ { "from": "human", "value": "\nIs white woolly sheep at center bigger than soft woolen lamb at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, white woolly sheep at center has a larger size compared to soft woolen lamb at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba72f906fda00d3a.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.124, 0.244) (B) (0.903, 0.934)" }, { "from": "gpt", "value": "(B) (0.903, 0.934)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b77c03ec453ee86.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) black suit at left (B) black suit at right (C) gray suit at center (D) matte black suit at center" }, { "from": "gpt", "value": "(B) black suit at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/819fbd41d39e4058.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the dark blue water at lower center among (A) yellow rubber boat at lower center (B) yellow rubber boat at lower left?" }, { "from": "gpt", "value": "(B) yellow rubber boat at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2377c5ddb2edd25.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.764, 0.311) (B) (0.224, 0.166)" }, { "from": "gpt", "value": "(B) (0.224, 0.166)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/546d26e20b10258b.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at upper right smaller than transparent glass tower at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca6f6fd7a61c7fcd.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark green leafy tree at upper right is wider than metallic wire at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, dark green leafy tree at upper right is wider than metallic wire at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de10dcdc03393014.jpg", "conversations": [ { "from": "human", "value": "\nIs black plastic sign at upper left below stainless steel sink at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, black plastic sign at upper left is above stainless steel sink at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b381caa5460d20f0.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy hillside at upper center is smaller than brick house at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5ed8633f99cbabda.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is bronze fountain at center located relative to white stone palace at upper left? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/853e39218cc8d951.jpg", "conversations": [ { "from": "human", "value": "\nIs dark fur bull at center wider than fuzzy dark brown bull at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, dark fur bull at center has a greater width compared to fuzzy dark brown bull at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed43b0a3ce24081c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the rainbow printed tank top at center? Choose among these: (A) white cotton shirt at center (B) gray cotton binoculars at right" }, { "from": "gpt", "value": "(A) white cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1518cb27034c1a28.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.477, 0.680) (B) (0.425, 0.420) (C) (0.510, 0.477)" }, { "from": "gpt", "value": "(C) (0.510, 0.477)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/12c770a9bc540c37.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) matte blue life vest at left (B) black plastic sunglasses at center (C) blue life vest at center" }, { "from": "gpt", "value": "(C) blue life vest at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db32e7024364d3a4.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.652, 0.181) (B) (0.742, 0.852)" }, { "from": "gpt", "value": "(A) (0.652, 0.181)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a8d2dbdf4d6965b.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) matte black coat at left (B) white cable-knit sweater at center (C) blue fleece jacket at center (D) cable knit sweater at center" }, { "from": "gpt", "value": "(D) cable knit sweater at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2566108efc804fd8.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) smooth asphalt road at center (B) dark gray fabric jacket at center (C) shiny black car at center (D) red fabric person at center" }, { "from": "gpt", "value": "(A) smooth asphalt road at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9aa00da0d3f01698.jpg", "conversations": [ { "from": "human", "value": "\nDoes green mossy stone at lower center have a smaller size compared to green mossy stone at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, green mossy stone at lower center occupies less space than green mossy stone at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7857367808c4e79.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is brown wooden fence at center located relative to green leafy tree at left? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7b680315547c689.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray suit at center have a lesser width compared to black dotted dress at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b36e9edfe22bfd6b.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the weathered wood barn at center? (A) brown woodpile at left (B) wooden barn at center" }, { "from": "gpt", "value": "(A) brown woodpile at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb455a449b30610b.jpg", "conversations": [ { "from": "human", "value": "\nDoes black plastic chair at upper right have a larger size compared to speckled feather pigeon at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, black plastic chair at upper right is bigger than speckled feather pigeon at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/714cc99fb52b264b.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue satin dress at center have a larger size compared to white fabric dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, blue satin dress at center has a larger size compared to white fabric dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f93e84084b15b949.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) dark blue silk tie at center (B) navy blue suit at center" }, { "from": "gpt", "value": "(B) navy blue suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/20863a87fbba535f.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the blue denim jacket at lower center? (A) light blue hoodie at lower center (B) clear water at pond center" }, { "from": "gpt", "value": "(B) clear water at pond center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b381fa588b0164fd.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of red fabric flag at left in reference to blue fabric flag at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4e4970e9920a7f40.jpg", "conversations": [ { "from": "human", "value": "\nIs brown sand at center positioned before green leafy tree at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, brown sand at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f28b2b95f91414c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if clear water at lower center is positioned above blue painted wood post at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, clear water at lower center is not positioned above blue painted wood post at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a10cd94170b7a6c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) black matte wooden horse at right (B) white plastic chair at left (C) white paper book at center (D) matte black jacket at center" }, { "from": "gpt", "value": "(A) black matte wooden horse at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0fe976aee49a834.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) plaid fabric snowsuit at lower left (B) white fluffy snow at center, is positioned farthest from the red fuzzy winter hat at upper right?" }, { "from": "gpt", "value": "(A) plaid fabric snowsuit at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cb329df963bb2b37.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny brown horse at center positioned before purple fleece jacket at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is in front of purple fleece jacket at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c97d845e341b7043.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at upper left further to the viewer compared to green leafy tree at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37b951db390e2482.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if red matte cargo ship at center is positioned to the left of white glossy boat at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, red matte cargo ship at center is not to the left of white glossy boat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f711cd30ab1a535a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white plastic fan at center is bigger than black matte fan at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, white plastic fan at center has a larger size compared to black matte fan at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/efba6d8f0e0e7662.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green stone stele at center is positioned to the right of dark blue coat at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, green stone stele at center is not to the right of dark blue coat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3efdcb34a0cb648c.jpg", "conversations": [ { "from": "human", "value": "\nIs black satin dress at center positioned at the back of white frosted cake at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/26bf7318d96e6328.jpg", "conversations": [ { "from": "human", "value": "\nWhere is golden matte cloud at upper center located in relation to golden textured sky at upper left in the image? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4509f19372358c7c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the brown wooden sign at center? Choose among these: (A) blue cotton shirt at center (B) red cotton shirt at center" }, { "from": "gpt", "value": "(B) red cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/327b834cbc5c7b01.jpg", "conversations": [ { "from": "human", "value": "\nIs flameflame-likefire at left bigger than white matte cowboy hat at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, flameflame-likefire at left is not larger than white matte cowboy hat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/744ccadce9a4e5c0.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if olive-green coat at upper right is bigger than dark blue military uniform at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c26b5e07f52b7cb1.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of gray matte t-shirt at center and black suede baseball cap at upper left in the image provided, where is gray matte t-shirt at center located with respect to black suede baseball cap at upper left? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/524197bb1c95f21d.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.955, 0.759) (B) (0.311, 0.916) (C) (0.723, 0.802)" }, { "from": "gpt", "value": "(A) (0.955, 0.759)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2fed0f95185a9ad2.jpg", "conversations": [ { "from": "human", "value": "\nIs green grassy hillside at lower center above green leafy tree at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, green grassy hillside at lower center is not above green leafy tree at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a072fdce52aa42e2.jpg", "conversations": [ { "from": "human", "value": "\nDoes green fabric shirt at center appear on the left side of matte red hat at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, green fabric shirt at center is positioned on the left side of matte red hat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8fc63ed90d951953.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) green grass at center (B) white marble column at center (C) white marble pillar at center (D) white matte sculpture at center" }, { "from": "gpt", "value": "(A) green grass at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/842ea09005d943d5.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) matte brown mushroom at upper left (B) brown wood nut at upper left" }, { "from": "gpt", "value": "(A) matte brown mushroom at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/09d755a7c211e95b.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the gray velvety sweater at lower right? (A) matte paper poster at center (B) cable-knit sweater at left (C) dark green jacket at center" }, { "from": "gpt", "value": "(C) dark green jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9fe948ed3ab80ca4.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the green fuzzy grass at center? Choose from: (A) green leafy tree at upper center (B) golden textured wheat at center" }, { "from": "gpt", "value": "(A) green leafy tree at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a47d570bf81f80c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) white cotton t-shirt at lower left (B) brown matte jacket at upper right" }, { "from": "gpt", "value": "(B) brown matte jacket at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e9fb33624d18d68.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the matte black shirt at center? (A) silver metallic laptop at center (B) whiteboard at left" }, { "from": "gpt", "value": "(A) silver metallic laptop at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/18119186d2c5387e.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.744, 0.805) (B) (0.350, 0.523) (C) (0.531, 0.658)" }, { "from": "gpt", "value": "(B) (0.350, 0.523)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/50246595d23b1d27.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark green textured tree at left appear over dirt path at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/613798df8b141a2c.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black hoodie at center come behind sleek silver laptop at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/923492cfc1078608.jpg", "conversations": [ { "from": "human", "value": "\nDoes yellow jersey at left appear on the left side of gray fabric shorts at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find yellow jersey at left to the left of gray fabric shorts at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e37e4fea1e3040f.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden bridge at center positioned at the back of wooden planks at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f156e48f7c6f8de9.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.398, 0.323) (B) (0.550, 0.312)" }, { "from": "gpt", "value": "(A) (0.398, 0.323)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f08ddd1176effad.jpg", "conversations": [ { "from": "human", "value": "\nWhere is matte black sweater at center located in relation to smooth plastic toy at center in the image? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a286f08823208626.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the black matte swimsuit at lower left? Choose from: (A) wooden dock at center (B) matte black swimsuit at center (C) matte black life preserver at upper left" }, { "from": "gpt", "value": "(B) matte black swimsuit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/af5cfa75e98ab6bf.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the white cotton shirt at upper right? Select from: (A) black cotton dress at center (B) white textured shirt at center" }, { "from": "gpt", "value": "(A) black cotton dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2375ec269e1e201.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of matte plastic table at center and green glass bottle at center in the image provided, where is matte plastic table at center located with respect to green glass bottle at center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/15baa9f9ab1ee465.jpg", "conversations": [ { "from": "human", "value": "\nIs white cotton shirt at lower right bigger than dark brown leather jacket at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, white cotton shirt at lower right is not bigger than dark brown leather jacket at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34ee9232fa96f815.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.293, 0.608) (B) (0.470, 0.652) (C) (0.737, 0.608) (D) (0.219, 0.791)" }, { "from": "gpt", "value": "(C) (0.737, 0.608)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a0817cb8b7d90410.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if pink fabric hairband at upper left is positioned below matte pink bow at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/067314c63fbdccb6.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the gray fabric hair at center? Select from: (A) matte blue life vest at center (B) blue fabric shirt at center (C) white water at center" }, { "from": "gpt", "value": "(B) blue fabric shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/756006b2f60916bb.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy palm tree at upper right is positioned to the left of green leafy palm tree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, green leafy palm tree at upper right is to the right of green leafy palm tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3baf8d3c158bacb4.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy bush at lower right closer to camera compared to shiny black car at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, green leafy bush at lower right is in front of shiny black car at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/efcb5e6280c94764.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if silver metallic suv at lower right is positioned above silver metallic sedan at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d33aef0a1a4b566.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is matte black jacket at center located relative to clear glass martini at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d8f8daad6064287.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.476, 0.544) (B) (0.968, 0.959) (C) (0.000, 0.095) (D) (0.903, 0.102)" }, { "from": "gpt", "value": "(B) (0.968, 0.959)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bb6f510b1fe97804.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the beige painted wall at center? (A) concrete sidewalk at lower center (B) white vinyl sign at upper center" }, { "from": "gpt", "value": "(B) white vinyl sign at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b99b8b51f813de0e.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.131, 0.459) (B) (0.258, 0.444)" }, { "from": "gpt", "value": "(A) (0.131, 0.459)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0855abf90222de7a.jpg", "conversations": [ { "from": "human", "value": "\nIs white glossy laptop at center to the left of matte black glasses at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, white glossy laptop at center is to the left of matte black glasses at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/56ba5261b3870dd3.jpg", "conversations": [ { "from": "human", "value": "\nWhere is woven brown basket at lower left located in relation to shiny green bananas at upper right in the image? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7fe9d21f5cbdc332.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.604, 0.839) (B) (0.490, 0.853) (C) (0.584, 0.864) (D) (0.557, 0.864)" }, { "from": "gpt", "value": "(B) (0.490, 0.853)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f8963be6ff3d485a.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) metallic gray barrier at center (B) satin black suv at center (C) satin black truck at center, is positioned farthest from the glossy blue suv at center?" }, { "from": "gpt", "value": "(C) satin black truck at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05e1219639968e51.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass at center closer to camera compared to purple matte shorts at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a0187a2cd0dbda7c.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of blue water at center in relation to white smooth bird at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/19c487dc2030e733.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of matte plastic magazine at center in relation to blonde synthetic wig at upper center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b6911709647025b7.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) orange fleece jacket at left (B) light blue denim jeans at center (C) metallic wire mesh at upper center (D) light beige striped shirt at center" }, { "from": "gpt", "value": "(A) orange fleece jacket at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4b44a321023c0b0.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) white striped shirt at left (B) floral fabric curtain at left" }, { "from": "gpt", "value": "(A) white striped shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a6a60db6d814e1cc.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white plastic badge at center is thinner than white cardstock ticket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, white plastic badge at center is not thinner than white cardstock ticket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36959fa4e0bce303.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is white shirt at lower right located relative to matte gold statue at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b71fdf9dc45124c.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) black matte goggles at center (B) matte black snowboard at center (C) matte black snowboarder at center (D) snowy/icy mountain at upper center" }, { "from": "gpt", "value": "(B) matte black snowboard at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6896b99057037983.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of smooth black post at left in reference to polished metal lamp post at left? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e20669477f12d148.jpg", "conversations": [ { "from": "human", "value": "\nDoes brushed red jacket at lower left appear on the left side of dark blue uniform at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find brushed red jacket at lower left to the left of dark blue uniform at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc99298b9f118c39.jpg", "conversations": [ { "from": "human", "value": "\nIs red matte t-shirt at left smaller than matte red t-shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, red matte t-shirt at left might be larger than matte red t-shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5cfff4050eeabaf.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.174, 0.691) (B) (0.265, 0.666) (C) (0.657, 0.797)" }, { "from": "gpt", "value": "(C) (0.657, 0.797)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46d837c1c5c4c692.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) speckled fur dog at left (B) green matte plant at left (C) speckled fur dog at center" }, { "from": "gpt", "value": "(B) green matte plant at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cb1ae9e8dcbadbd4.jpg", "conversations": [ { "from": "human", "value": "\nDoes metallic gray bookshelf at center have a larger size compared to white textured brick at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, metallic gray bookshelf at center has a larger size compared to white textured brick at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/074427ca434bbd2b.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray fabric shirt at center have a lesser width compared to beige straw hay at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, gray fabric shirt at center's width is less than beige straw hay at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/21c373840e76ee9c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white sand at center is smaller than pastel pink fabric pants at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, white sand at center is smaller than pastel pink fabric pants at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9a5f308725a2d45b.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) khaki cotton cap at upper right (B) black cotton t-shirt at center" }, { "from": "gpt", "value": "(A) khaki cotton cap at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a3c30398da7043a.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is blue floral swim trunks at center located relative to gold/yellow fabric bikini top at center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78f0654647211741.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the black fabric bag at lower center? Choose from: (A) white fabric shirt at lower center (B) white matte arm at center" }, { "from": "gpt", "value": "(B) white matte arm at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/76a20ab0ba0bdac6.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) black plastic pen at center (B) dark brown corduroy jacket at center (C) blue denim jeans at center (D) white glossy phone at upper right" }, { "from": "gpt", "value": "(D) white glossy phone at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce411066836cada6.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.785, 0.270) (B) (0.058, 0.178)" }, { "from": "gpt", "value": "(A) (0.785, 0.270)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6a41ef46245e6bfb.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of rusty metal grate at center in reference to white plastic sign at upper center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8342f2037d542286.jpg", "conversations": [ { "from": "human", "value": "\nDoes smooth concrete pavement at center appear on the left side of beige fabric coat at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, smooth concrete pavement at center is not on the left side of beige fabric coat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/747f5ed5f71685b7.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) blue denim jacket at lower right (B) beige fabric jacket at lower right" }, { "from": "gpt", "value": "(B) beige fabric jacket at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/985c3a5e0e7b3920.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.980, 0.756) (B) (0.424, 0.691)" }, { "from": "gpt", "value": "(A) (0.980, 0.756)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/393e0dcfc9047802.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) wet fur dog at center (B) white fluffy snow at center, is positioned closest to the smooth bark tree at upper right?" }, { "from": "gpt", "value": "(B) white fluffy snow at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/754f2a14e272f115.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white matte shirt at center is smaller than matte white shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, white matte shirt at center is smaller than matte white shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/795ac94da6e75669.jpg", "conversations": [ { "from": "human", "value": "\nWhere is black plush toy at left located in relation to brown plush bear at upper center in the image? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f2d004c973fecf3.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow plush costume at center to the left of velvet black costume at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, yellow plush costume at center is not on the left side of velvet black costume at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff03c4c94273e155.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) checkered fabric shirt at center (B) red and white fabric flag at left (C) floral fabric dress at center" }, { "from": "gpt", "value": "(C) floral fabric dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d986a13efb1cad2c.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of red matte ski at lower right and red fabric snowboarder at lower right in the image provided, where is red matte ski at lower right located with respect to red fabric snowboarder at lower right? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9540171e21ff6134.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is glossy black sedan at center located relative to silver metallic hatchback at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db33c6d9056fa563.jpg", "conversations": [ { "from": "human", "value": "\nIs transparent glass fountain at center further to camera compared to white glossy fountain at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9673f18726a0fbbb.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the blue glossy balloon at upper right? (A) plaid fabric shirt at left (B) black matte glasses at center" }, { "from": "gpt", "value": "(A) plaid fabric shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/319d126c566446a6.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the brown paper bulletin board at right? Choose from: (A) white paper at center (B) dark brown hair at upper left" }, { "from": "gpt", "value": "(B) dark brown hair at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/99c8c4c33c184625.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte shirt at center to the right of matte black hair at lower right from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, white matte shirt at center is not to the right of matte black hair at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e126f875a3cd9aa7.jpg", "conversations": [ { "from": "human", "value": "\nIs red matte train at center below yellow/black striped pole at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe20f2e94cda34ba.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte gray backpack at lower left appear on the left side of matte blue backpack at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, matte gray backpack at lower left is not to the left of matte blue backpack at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/90a2e4bc8df48a1c.jpg", "conversations": [ { "from": "human", "value": "\nIs brown wool suit at center positioned before matte brown suit at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, brown wool suit at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b789e905e54889e.jpg", "conversations": [ { "from": "human", "value": "\nDoes rainbow leggings at center have a smaller size compared to blue uniform at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, rainbow leggings at center has a smaller size compared to blue uniform at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/281ae62160ab7f26.jpg", "conversations": [ { "from": "human", "value": "\nIs brown sandy dirt track at center thinner than white fluffy dog at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b32d870d6fe52662.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark gray sweater at center lie in front of blonde hair at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is behind blonde hair at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cdcc3a892e42a373.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the matte black hair at upper left? Select from: (A) smooth black hair at center (B) blue checkered tablecloth at lower center" }, { "from": "gpt", "value": "(B) blue checkered tablecloth at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/14f1c90cb586f854.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.336, 0.773) (B) (0.110, 0.075)" }, { "from": "gpt", "value": "(B) (0.110, 0.075)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5f56dbf1e890ea24.jpg", "conversations": [ { "from": "human", "value": "\nIs floral cotton dress at center bigger than wooden bench at right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, floral cotton dress at center is not bigger than wooden bench at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d18667ff87e66dd.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black and white striped dress at center is positioned above black glossy laptop at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, black and white striped dress at center is located above black glossy laptop at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e5c41aa4f3180f26.jpg", "conversations": [ { "from": "human", "value": "\nIs black leather jacket at upper left to the right of gray beard at right from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, black leather jacket at upper left is not to the right of gray beard at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/091ba298b013ae55.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.253, 0.927) (B) (0.438, 0.714)" }, { "from": "gpt", "value": "(B) (0.438, 0.714)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5a2d712561e0224.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.035, 0.202) (B) (0.013, 0.653) (C) (0.430, 0.838) (D) (0.920, 0.267)" }, { "from": "gpt", "value": "(D) (0.920, 0.267)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/736d68d5854d82e7.jpg", "conversations": [ { "from": "human", "value": "\nDoes clear blue water at lower center have a larger size compared to denim jacket at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, clear blue water at lower center has a larger size compared to denim jacket at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ad311a9cf025234.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) gray wool suit at center (B) matte black dress at lower left" }, { "from": "gpt", "value": "(B) matte black dress at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/544e1086b45b817f.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the white soft cloth at center? (A) knitted dark blue sweater at center (B) black felt hat at upper center" }, { "from": "gpt", "value": "(A) knitted dark blue sweater at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ee650db9ff04cc8f.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) rusty concrete bridge at upper center (B) white metallic fire truck at center (C) silver metallic truck at center" }, { "from": "gpt", "value": "(A) rusty concrete bridge at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f37f9d17e8a31fa.jpg", "conversations": [ { "from": "human", "value": "\nDoes gold textured curtain at upper left appear on the left side of gold textured curtain at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, gold textured curtain at upper left is not to the left of gold textured curtain at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/327df1425f37b5d6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if wooden cabin at center is wider than green fabric tent at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, wooden cabin at center is wider than green fabric tent at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bdfbe7e35f7a8d0c.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of dark brown t-shirt at center in reference to light blue denim shorts at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4b6e301216e191e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) silver metallic bolt at center (B) metallic brake rotor at center" }, { "from": "gpt", "value": "(A) silver metallic bolt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6eae34347287a41e.jpg", "conversations": [ { "from": "human", "value": "\nDoes speckled feathered turkey at center have a smaller size compared to speckled feathered turkey at right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, speckled feathered turkey at center is not smaller in size than speckled feathered turkey at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6fcc5f22ad5908df.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) white fluffy cloud at upper left (B) gold textured tower at center" }, { "from": "gpt", "value": "(A) white fluffy cloud at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/98e40d90b7e09d62.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy hillside at center appear on the left side of gray rough rock at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, green leafy hillside at center is not to the left of gray rough rock at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1cb61b1501f3bd56.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is matte fabric woman at upper left located relative to white soft pillow at upper center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1aa6bc9ad5f65e08.jpg", "conversations": [ { "from": "human", "value": "\nIs white paper billboard at center positioned in front of shiny chrome beach ball at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, white paper billboard at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73dea5da926935c6.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of wire mesh fence at center less distant than that of yellow-green spotted leaf at center-right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, wire mesh fence at center is further to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/18b5d60f8ed15aad.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) green matte cucumber at lower left (B) matte plastic strawberry at center left (C) orange plastic bottle at upper right" }, { "from": "gpt", "value": "(C) orange plastic bottle at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/57c7831945999578.jpg", "conversations": [ { "from": "human", "value": "\nIs matte white hand at center positioned before matte skin hand at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/caad0774f86b44e7.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) matte black jacket at center (B) black matte cap at upper right (C) black fabric baseball cap at upper right" }, { "from": "gpt", "value": "(A) matte black jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7933e9ed14549ae6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if mahogany wood door at center is positioned to the right of white plastic sign at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, mahogany wood door at center is to the left of white plastic sign at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2a496e189fae470b.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.884, 0.866) (B) (0.285, 0.762) (C) (0.475, 0.386) (D) (0.053, 0.997)" }, { "from": "gpt", "value": "(D) (0.053, 0.997)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/76e24ac6b229da6f.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.311, 0.306) (B) (0.207, 0.250)" }, { "from": "gpt", "value": "(A) (0.311, 0.306)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a3c0aed055ba8b6a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.061, 0.377) (B) (0.919, 0.883) (C) (0.450, 0.845)" }, { "from": "gpt", "value": "(C) (0.450, 0.845)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/13698ea19858d77e.jpg", "conversations": [ { "from": "human", "value": "\nDoes light blue fabric suit at center have a larger size compared to green sweater at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, light blue fabric suit at center is larger in size than green sweater at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/61f3fc212e0603c6.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.009, 0.875) (B) (0.321, 0.903)" }, { "from": "gpt", "value": "(B) (0.321, 0.903)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c1599e83e1585dd.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the hawaiian print shirt at center from the following options: (A) pink fabric shirt at left (B) teal fabric shirt at center (C) dark blue shirt at center (D) dark blue fabric jacket at center?" }, { "from": "gpt", "value": "(D) dark blue fabric jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a7cc539c66f391d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.539, 0.439) (B) (0.423, 0.380)" }, { "from": "gpt", "value": "(A) (0.539, 0.439)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77c782ad6ad345a6.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) dirt/gravel path at center (B) brick wall at right" }, { "from": "gpt", "value": "(A) dirt/gravel path at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8508ae38547b9d24.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black textured coat at center is positioned to the right of smooth skin at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, black textured coat at center is to the left of smooth skin at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4225423cce31b23c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green matte trees at upper center is wider than matte black backpack at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/004da084748d5392.jpg", "conversations": [ { "from": "human", "value": "\nIs white shirt at lower right to the right of shiny green bird at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, white shirt at lower right is to the right of shiny green bird at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/988a72e7188dec3a.jpg", "conversations": [ { "from": "human", "value": "\nIs green textured hill at center positioned in front of brown dirt track at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is behind brown dirt track at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed8b5791aee9774e.jpg", "conversations": [ { "from": "human", "value": "\nIs white smooth arrow at center to the left of matte orange pillar at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, white smooth arrow at center is not on the left side of matte orange pillar at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e13bcff208fff3e.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of red matte umbrella at center in reference to matte black umbrella at upper right? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9cfbcef2a317bd7a.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at center to the right of matte black glasses at upper left from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, green leafy tree at center is not to the right of matte black glasses at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4b6ff9fc1f4b615c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte gray backpack at center is positioned to the left of gray fabric backpack at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find matte gray backpack at center to the left of gray fabric backpack at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6353907b1cf89a0c.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of pink fabric baby at lower center more distant than that of wooden pole at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d4e113cf67ac130.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black leather jacket at left appear over matte black fedora at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aff1c6fd11dde229.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) glossy red car at center (B) white plastic license plate at center" }, { "from": "gpt", "value": "(A) glossy red car at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/412334e18f20071e.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of dark green military uniform at right and velvet gold uniform at center in the image provided, where is dark green military uniform at right located with respect to velvet gold uniform at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a62746bd83e3dc7.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) white fabric spacesuit at left (B) brown cotton shirt at center (C) black matte shirt at center" }, { "from": "gpt", "value": "(B) brown cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4d7c129be9185e7b.jpg", "conversations": [ { "from": "human", "value": "\nIs white glossy table at center thinner than black textured sweater at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, white glossy table at center might be wider than black textured sweater at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a19193d9f7872252.jpg", "conversations": [ { "from": "human", "value": "\nIs white paper certificate at center smaller than wooden picnic table at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white paper certificate at center is not smaller in size than wooden picnic table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/112fe35e9f44540e.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.675, 0.903) (B) (0.840, 0.523) (C) (0.803, 0.678)" }, { "from": "gpt", "value": "(B) (0.840, 0.523)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b475ce45aa414a14.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) denim overalls at center (B) green denim overalls at center (C) striped cotton shirt at left (D) white cotton shirt at center" }, { "from": "gpt", "value": "(D) white cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d51b4fc38f3fe540.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black figure at upper right thinner than white matte leg at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b6a619d234ad8683.jpg", "conversations": [ { "from": "human", "value": "\nIs maroon shirt at center smaller than white fabric flag at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/933709d84d989c0e.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.450, 0.409) (B) (0.464, 0.164) (C) (0.478, 0.084)" }, { "from": "gpt", "value": "(B) (0.464, 0.164)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de7d6bfb235ee723.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.665, 0.750) (B) (0.789, 0.414) (C) (0.686, 0.472)" }, { "from": "gpt", "value": "(B) (0.789, 0.414)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6bda08eb1c62d9db.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black jersey at center is positioned to the right of blue jersey at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, matte black jersey at center is to the left of blue jersey at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4cb65ccd02e6cc1.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if knitted wool beanie at upper right is wider than blue metal chair at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, knitted wool beanie at upper right has a greater width compared to blue metal chair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4349ede9a38d8fd4.jpg", "conversations": [ { "from": "human", "value": "\nDoes rusty wood dock at center have a lesser width compared to matte black jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2391ad87a32f3281.jpg", "conversations": [ { "from": "human", "value": "\nIs black satin dress at center below gray hoodie at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, black satin dress at center is not below gray hoodie at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1bf5da2b68e848a.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.872, 0.195) (B) (0.710, 0.180) (C) (0.756, 0.537)" }, { "from": "gpt", "value": "(C) (0.756, 0.537)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e5f7b6df8eaa9d58.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) striped cotton shirt at left (B) gray fleece jacket at center (C) blue hoodie at center (D) matte gray hoodie at center" }, { "from": "gpt", "value": "(A) striped cotton shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/66191bd26f15385e.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the matte black jacket at left? (A) matte black flag at upper left (B) white matte soccer uniforms at center" }, { "from": "gpt", "value": "(B) white matte soccer uniforms at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a949bee9f35cfa07.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white glossy boat at center is positioned below clear water at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, white glossy boat at center is below clear water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/610e00a4f35fa0ab.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) black velvet gown at center (B) black matte graduation gown at center (C) matte black graduation gown at center" }, { "from": "gpt", "value": "(A) black velvet gown at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/12419dc35795d29e.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of white matte bus at center and red sweater at center in the image provided, where is white matte bus at center located with respect to red sweater at center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a1b6195d0ea7978.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.674, 0.995) (B) (0.236, 0.300)" }, { "from": "gpt", "value": "(A) (0.674, 0.995)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5b8a36bf8c18555.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.420, 0.520) (B) (0.079, 0.311) (C) (0.339, 0.620)" }, { "from": "gpt", "value": "(B) (0.079, 0.311)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d736d91292c7041.jpg", "conversations": [ { "from": "human", "value": "\nIs matte brown donkey at center closer to camera compared to wooden bench at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, matte brown donkey at center is in front of wooden bench at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cfe392d2908e04f8.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.520, 0.342) (B) (0.350, 0.964)" }, { "from": "gpt", "value": "(A) (0.520, 0.342)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f3fe982e6d1ed60.jpg", "conversations": [ { "from": "human", "value": "\nDoes glossy reflective water at center have a lesser width compared to matte gray mountain at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5301ca65bcd20750.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the black silk suit at upper right among (A) black leather jacket at center (B) shiny dark blue suit at center?" }, { "from": "gpt", "value": "(B) shiny dark blue suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed7044d4caf24e56.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.665, 0.620) (B) (0.319, 0.613)" }, { "from": "gpt", "value": "(B) (0.319, 0.613)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ec30a8ef73e0d5a.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the black matte helmet at center? Choose among these: (A) matte black goggles at center (B) glossy black mirror at center" }, { "from": "gpt", "value": "(B) glossy black mirror at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c84550354845b57b.jpg", "conversations": [ { "from": "human", "value": "\nIs dark gray wool coat at center bigger than light brown leather jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8f13a7a79f3fa5b6.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of purple soft fabric baby at center in reference to teal sweater at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/69d8d14f8f0c3ea6.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of brown murky water at center in relation to light gray concrete houseboat at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4286b2a2db9911da.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.578, 0.887) (B) (0.011, 0.791) (C) (0.992, 0.530)" }, { "from": "gpt", "value": "(A) (0.578, 0.887)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc48d414a3a3d73e.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the black puffy jacket at center? (A) dark brown hair at upper center (B) black matte jacket at left (C) blue crystal pendant at upper center" }, { "from": "gpt", "value": "(A) dark brown hair at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/460596216829a060.jpg", "conversations": [ { "from": "human", "value": "\nDoes pink fabric skirt at center have a greater width compared to white plastic projector at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, pink fabric skirt at center has a greater width compared to white plastic projector at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b66c5d756fee6e80.jpg", "conversations": [ { "from": "human", "value": "\nIs brown stone clock tower at center further to camera compared to gold textured clock at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8cb76fdbd3d3ec78.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.910, 0.989) (B) (0.668, 0.852)" }, { "from": "gpt", "value": "(B) (0.668, 0.852)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c577e98cee20c324.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte pink robe at left is positioned to the left of matte pink silk robe at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte pink robe at left is to the left of matte pink silk robe at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c14b1e17ff7bc4a8.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte t-shirt at left bigger than white cardboard at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, black matte t-shirt at left is larger in size than white cardboard at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b6caffccfa9249ab.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.444, 0.836) (B) (0.250, 0.616)" }, { "from": "gpt", "value": "(A) (0.444, 0.836)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d68ee67b0f8a184.jpg", "conversations": [ { "from": "human", "value": "\nIs metal train track at center bigger than yellow cotton sari at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, metal train track at center is larger in size than yellow cotton sari at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b836f9b9c79eb44c.jpg", "conversations": [ { "from": "human", "value": "\nIs natural straw skirt at center wider than black woven grass skirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, natural straw skirt at center has a greater width compared to black woven grass skirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0fe3478e7db4ab77.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) red fabric jacket at lower left (B) matte black bookshelf at lower left" }, { "from": "gpt", "value": "(A) red fabric jacket at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aa16f9636350ed1d.jpg", "conversations": [ { "from": "human", "value": "\nIs denim jacket at upper left above white fabric baseball cap at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, denim jacket at upper left is not above white fabric baseball cap at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f0521e600836c838.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) metallic chain-link fence at upper right (B) shiny brown puppy at center" }, { "from": "gpt", "value": "(B) shiny brown puppy at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f5f6d11958d5654.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.879, 0.639) (B) (0.244, 0.734)" }, { "from": "gpt", "value": "(A) (0.879, 0.639)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c314a492074c069b.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the white checkered shirt at center? Choose from: (A) blue checkered shirt at center (B) blue cotton shirt at center" }, { "from": "gpt", "value": "(A) blue checkered shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/407168f8840071a8.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the pink matte ice cream cone at upper right? Choose among these: (A) leather pants at left (B) jeans at center (C) chocolate matte ice cream cone at upper right" }, { "from": "gpt", "value": "(B) jeans at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95026177b459c264.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if camouflage quilted jacket at center is positioned to the left of yellow plastic slide at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find camouflage quilted jacket at center to the left of yellow plastic slide at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed25b1f776759304.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.550, 0.619) (B) (0.319, 0.586) (C) (0.864, 0.658)" }, { "from": "gpt", "value": "(B) (0.319, 0.586)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9e3d0d6974dd005c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if cloudy sky at upper center is thinner than dark blue water at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cce3bbeb66b82c20.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.202, 0.362) (B) (0.440, 0.170) (C) (0.619, 0.972) (D) (0.734, 0.339)" }, { "from": "gpt", "value": "(C) (0.619, 0.972)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f775c26da8ad00f.jpg", "conversations": [ { "from": "human", "value": "\nDoes light beige shirt at lower left appear on the left side of light brown hair at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, light beige shirt at lower left is positioned on the left side of light brown hair at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/472b9f56d3932476.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) blue fabric shirt at lower right (B) green grass at center, is positioned closest to the matte black backpack at center-right?" }, { "from": "gpt", "value": "(A) blue fabric shirt at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/74c9b899a5611fbc.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of matte brown shirt at center in reference to wooden at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cce73d13e87da61f.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue cotton shirt at center lie in front of white cotton shirt at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f748e0fed868eefe.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) white matte jersey at center (B) white jersey at center" }, { "from": "gpt", "value": "(B) white jersey at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e448125517a58148.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) floral print fabric dress at left (B) floral fabric dress at center" }, { "from": "gpt", "value": "(B) floral fabric dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f0f73b13aa6efe67.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.203, 0.384) (B) (0.833, 0.339) (C) (0.279, 0.602) (D) (0.652, 0.419)" }, { "from": "gpt", "value": "(B) (0.833, 0.339)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/312525ce05c2f152.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is matte brown backpack at center located relative to dark green fabric jacket at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/415d3df4fab7be57.jpg", "conversations": [ { "from": "human", "value": "\nIs orange fabric jacket at center to the right of orange fleece jacket at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, orange fabric jacket at center is positioned on the right side of orange fleece jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5fe91b3ec35355b3.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) snowy rocky peak at left (B) cloudy textured mountain at upper center (C) rugged stone mountain range at center" }, { "from": "gpt", "value": "(B) cloudy textured mountain at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d994f84e19b7ff62.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is bare wood tree at upper right located relative to green fabric vest at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/53ba48e434617a64.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the gray rough stone at right among (A) green matte leafy branch at upper left (B) green matte leafy branch at upper center?" }, { "from": "gpt", "value": "(B) green matte leafy branch at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73e8cfb5bd07bc08.jpg", "conversations": [ { "from": "human", "value": "\nDoes translucent glass orbs at center have a greater width compared to gray stone pole at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cfeded6b8a538bbf.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white woolen sweater at upper left is wider than patterned wool scarf at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/62402cdcf5cfce2b.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) gray stone bell tower at center (B) autumn leaves at center (C) autumn leaves at left, is positioned farthest from the brown leafy tree at center?" }, { "from": "gpt", "value": "(C) autumn leaves at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44b6a3f2db356162.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the dark green uniform at lower left from the following options: (A) wooden shack at lower right (B) black matte figure at center?" }, { "from": "gpt", "value": "(B) black matte figure at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/360abe4e47b285d4.jpg", "conversations": [ { "from": "human", "value": "\nIs orange matte sign at upper center to the left of orange matte sign at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, orange matte sign at upper center is not to the left of orange matte sign at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/244357035796952b.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue cotton shirt at upper right come behind smooth skin face at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7f7d2e6db8cbd7b2.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown glossy horse at left appear under black rubber nose at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, brown glossy horse at left is not positioned below black rubber nose at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82a87d6618bd4515.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) light beige jacket at lower left (B) light beige pedestrians at lower center (C) light brown leather jacket at center (D) dark gray sweater at lower left" }, { "from": "gpt", "value": "(B) light beige pedestrians at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b322e115a8c139d5.jpg", "conversations": [ { "from": "human", "value": "\nIs red-white-blue fabric flag at right smaller than white plastic cup at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, red-white-blue fabric flag at right is not smaller than white plastic cup at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/69f63b2a12ccead3.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) blue tie-dye shirt at right (B) blonde hair at center" }, { "from": "gpt", "value": "(A) blue tie-dye shirt at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/65ddd4e5263a4ec2.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte white shirt at left appear under matte green hand at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, matte white shirt at left is below matte green hand at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a0f229d75118f683.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white softshell jacket at center is positioned below tan fabric hat at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08920f5d3dcf9f2b.jpg", "conversations": [ { "from": "human", "value": "\nDoes white plastic exhaust hood at upper left appear over white glossy drawer at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, white plastic exhaust hood at upper left is positioned over white glossy drawer at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c010af9587fdfc6e.jpg", "conversations": [ { "from": "human", "value": "\nDoes camouflage fabric uniform at center appear under matte black video camera at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, camouflage fabric uniform at center is not below matte black video camera at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5bbd6981d2433fd9.jpg", "conversations": [ { "from": "human", "value": "\nIs white fluffy snow at lower center to the right of dark matte jacket at left from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find white fluffy snow at lower center to the right of dark matte jacket at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/35a430f4d2f4ab69.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.505, 0.744) (B) (0.392, 0.634)" }, { "from": "gpt", "value": "(B) (0.392, 0.634)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a12a760d70f6608b.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) black matte sunglasses at left (B) plaid scarf at center (C) matte black sunglasses at left (D) dark blue jacket at center" }, { "from": "gpt", "value": "(D) dark blue jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c554c469a99fc50.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown sandy dirt road at center is smaller than brown wooden pole at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, brown sandy dirt road at center has a smaller size compared to brown wooden pole at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db8c75b32dbee867.jpg", "conversations": [ { "from": "human", "value": "\nIs white concrete pavement at center smaller than dark gray metal pole at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, white concrete pavement at center might be larger than dark gray metal pole at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/201010972fb7ea62.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.161, 0.978) (B) (0.219, 0.044) (C) (0.453, 0.125)" }, { "from": "gpt", "value": "(B) (0.219, 0.044)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0bdbec78fb1b4d08.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.072, 0.708) (B) (0.200, 0.431) (C) (0.572, 0.920) (D) (0.233, 0.852)" }, { "from": "gpt", "value": "(D) (0.233, 0.852)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e073a86351ae57f6.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown furry deer at center appear under brown fur deer at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6caa77816dd4ab88.jpg", "conversations": [ { "from": "human", "value": "\nWhere is orange fleece jacket at center right located in relation to light brown fabric jacket at lower left in the image? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04a28c49050884b3.jpg", "conversations": [ { "from": "human", "value": "\nDoes denim shirt at left have a smaller size compared to gray woolen cardigan at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, denim shirt at left occupies less space than gray woolen cardigan at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1403567c4b4e1b25.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of white textured bench at center and polished stainless steel elevator at left in the image provided, where is white textured bench at center located with respect to polished stainless steel elevator at left? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d02016fff3cd4e54.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte red cube at left is positioned to the right of blue matte toy at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, matte red cube at left is not to the right of blue matte toy at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f7ea9f6d90fb852.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) green felt billiard table at center (B) purple matte table tennis at center" }, { "from": "gpt", "value": "(A) green felt billiard table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b7a2ae4705f5846.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) blue denim pants at left (B) printed fabric shirt at center (C) maroon matte car at left, is positioned farthest from the white glossy sedan at center?" }, { "from": "gpt", "value": "(A) blue denim pants at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc67e8c550029144.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the white textured bench at center among (A) textured beige sweater at center (B) concrete bench at center?" }, { "from": "gpt", "value": "(A) textured beige sweater at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/40b4fdd2ca55ebf8.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.388, 0.141) (B) (0.529, 0.056)" }, { "from": "gpt", "value": "(A) (0.388, 0.141)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b878b6039c53f7ac.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) white fabric backpack at center (B) light blue t-shirt at lower left" }, { "from": "gpt", "value": "(B) light blue t-shirt at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/10320f27034e6746.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if metallic blue sedan at lower left is wider than metallic blue car at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of metallic blue sedan at lower left exceeds that of metallic blue car at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5720cbffaa8c559.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the black chalkboard specials at upper center among (A) brown wood table at center (B) gray cotton shirt at right (C) dark brown leather chair at right (D) matte red shirt at center?" }, { "from": "gpt", "value": "(D) matte red shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/079a6948acf10f96.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the dark wool coat at center among (A) dark brown leather jacket at center (B) green matte tree at left (C) brick pavement at center (D) dark brown leather coat at center?" }, { "from": "gpt", "value": "(B) green matte tree at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aecafcd6cce44448.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) matte red swim trunks at center (B) red fabric shorts at lower left (C) matte red baseball cap at upper center" }, { "from": "gpt", "value": "(A) matte red swim trunks at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ddf6ea52de457cf.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) brick stone castle at center (B) green leafy tree at upper center (C) green leafy hedge at left (D) green leafy tree at left" }, { "from": "gpt", "value": "(A) brick stone castle at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/653b5f3e73cd1d93.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white cotton shirt at center is positioned below silver metallic laptop at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16351b0fce316885.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.683, 0.097) (B) (0.354, 0.248) (C) (0.815, 0.030) (D) (0.951, 0.645)" }, { "from": "gpt", "value": "(D) (0.951, 0.645)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/31a3bdbaa8cafc44.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) illuminated plastic tree at center (B) black matte christmas tree at lower left (C) illuminated plastic tree at upper left" }, { "from": "gpt", "value": "(B) black matte christmas tree at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/18887018673d45a6.jpg", "conversations": [ { "from": "human", "value": "\nIs clear blue water at center in front of metallic gray folding chair at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is behind metallic gray folding chair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08ed94efe7309458.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) red matte shirt at center (B) green stone water at lower left" }, { "from": "gpt", "value": "(B) green stone water at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c921d7602e1106b2.jpg", "conversations": [ { "from": "human", "value": "\nDoes striped fabric at lower center appear on the left side of fuzzy dark brown dog at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, striped fabric at lower center is not on the left side of fuzzy dark brown dog at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b19483cc119aa19.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if red fabric shirt at center is positioned above black fabric flag at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d5bca150cb4e712.jpg", "conversations": [ { "from": "human", "value": "\nIs floral fabric skirt at left closer to camera compared to matte cardboard box at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, floral fabric skirt at left is further to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e2a84c208c4a239b.jpg", "conversations": [ { "from": "human", "value": "\nIs matte white kimono doll at center below matte red platter at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3089f09c70ba618e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.153, 0.539) (B) (0.180, 0.537)" }, { "from": "gpt", "value": "(A) (0.153, 0.539)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b81b7519f038fef8.jpg", "conversations": [ { "from": "human", "value": "\nDoes black wrought iron fence at lower center appear under stone tower at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2331c7659f4d27e1.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of black suit at center less distant than that of orange striped tie at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a2ed91c30ab3399.jpg", "conversations": [ { "from": "human", "value": "\nIs white sandy beach at lower center to the right of wooden fence at lower center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, white sandy beach at lower center is to the right of wooden fence at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dcfe71161aae122b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if neon yellow tank top at center is bigger than matte black tank top at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, neon yellow tank top at center has a larger size compared to matte black tank top at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c2be11de3cc19676.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of black paper at left and matte black rifle at center in the image provided, where is black paper at left located with respect to matte black rifle at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c02da8e48b1121e6.jpg", "conversations": [ { "from": "human", "value": "\nIs gray rock at center to the right of brown dry grass at right from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, gray rock at center is not to the right of brown dry grass at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/96d27873bb74e352.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if shiny yellow and black fish at center is wider than shiny blue and yellow fish at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, shiny yellow and black fish at center might be narrower than shiny blue and yellow fish at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/211e8ad9e12b0821.jpg", "conversations": [ { "from": "human", "value": "\nDoes satin blue stone at center lie behind blue glass stone at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, satin blue stone at center is behind blue glass stone at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3aed7fb198f62e4a.jpg", "conversations": [ { "from": "human", "value": "\nIs autumn leaves at center smaller than matte orange tree at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, autumn leaves at center might be larger than matte orange tree at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c56eef6d94680598.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is pink plaid shirt at left located relative to blue jeans at lower right? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3062f8a1ab18a309.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) smooth brown jacket at upper left (B) plaid shirt at lower right" }, { "from": "gpt", "value": "(A) smooth brown jacket at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f8214483f7a189c4.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.759, 0.898) (B) (0.400, 0.152)" }, { "from": "gpt", "value": "(A) (0.759, 0.898)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/868bddd49b24df52.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.233, 0.873) (B) (0.377, 0.802) (C) (0.579, 0.681) (D) (0.070, 0.986)" }, { "from": "gpt", "value": "(D) (0.070, 0.986)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b275d0c607259b5.jpg", "conversations": [ { "from": "human", "value": "\nDoes green matte blinds at upper center have a greater width compared to tropical fabric curtain at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, the width of green matte blinds at upper center exceeds that of tropical fabric curtain at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82e2553928f4d0dc.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) blue water at center (B) white wooden sailboat at center (C) white wooden boat at center" }, { "from": "gpt", "value": "(C) white wooden boat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44599a8a8fec0fe9.jpg", "conversations": [ { "from": "human", "value": "\nIs brown dry grass at center further to camera compared to glossy brown giraffe at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1cafe1b11b61042a.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the illuminated glass christmas tree at left? (A) dark gray jacket at lower center (B) polished bronze lion at center" }, { "from": "gpt", "value": "(B) polished bronze lion at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a81d03c16ade405.jpg", "conversations": [ { "from": "human", "value": "\nIs brown fuzzy donkey at upper center smaller than white woolen sheep at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, brown fuzzy donkey at upper center might be larger than white woolen sheep at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/201c5f10164cd2e7.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) gray fabric jacket at lower right (B) metallic silver chair at lower center (C) blue fabric jacket at right (D) matte gray desk at center" }, { "from": "gpt", "value": "(B) metallic silver chair at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/246a3df93ea645c6.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) matte black chair at center (B) clear glass pool at center" }, { "from": "gpt", "value": "(B) clear glass pool at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/20666aa20de3c9f1.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of black fabric at lower right and black plastic projector at lower center in the image provided, where is black fabric at lower right located with respect to black plastic projector at lower center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aa46adace54f21d6.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) yellow matte shirt at right (B) green striped sweater at center" }, { "from": "gpt", "value": "(A) yellow matte shirt at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7de87d3470dd7f6c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) black leather jacket at center (B) white powdery snow at center" }, { "from": "gpt", "value": "(B) white powdery snow at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b77e67b0f3e70dd.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte pink flower at center appear under smooth red flower at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, matte pink flower at center is below smooth red flower at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/775d29467d37873b.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.863, 0.786) (B) (0.309, 0.733)" }, { "from": "gpt", "value": "(A) (0.863, 0.786)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/685a2ef8fed6c5a9.jpg", "conversations": [ { "from": "human", "value": "\nDoes green mossy log at center have a greater width compared to green leafy fern at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, the width of green mossy log at center exceeds that of green leafy fern at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3f9c46e6a9a50ca4.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) gold metallic bracelet at center (B) wooden polished table at center" }, { "from": "gpt", "value": "(B) wooden polished table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/422d36c71e130360.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the shiny plastic plate at lower left? Choose from: (A) red plastic table at center (B) pink fabric bib at upper right" }, { "from": "gpt", "value": "(A) red plastic table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd7cf4b4a8909a2e.jpg", "conversations": [ { "from": "human", "value": "\nIs blue fabric tank top at center positioned in front of gray cotton t-shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, blue fabric tank top at center is behind gray cotton t-shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9a4093e51196b139.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at center appear over green wrought iron fence at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green leafy tree at center is positioned over green wrought iron fence at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f7ac0daca679938.jpg", "conversations": [ { "from": "human", "value": "\nDoes wooden bench at lower left have a larger size compared to brown leather jacket at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e74326c049d33ed1.jpg", "conversations": [ { "from": "human", "value": "\nIs gray metallic truck at center below wooden ladder at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, gray metallic truck at center is positioned under wooden ladder at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73895a3dafed264a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.361, 0.781) (B) (0.417, 0.350) (C) (0.104, 0.953)" }, { "from": "gpt", "value": "(A) (0.361, 0.781)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/15cabbf566ae2565.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) green leafy tree at upper center (B) dark brown wooden stairs at lower center" }, { "from": "gpt", "value": "(B) dark brown wooden stairs at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29aa910fbd528bad.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.696, 0.747) (B) (0.299, 0.347)" }, { "from": "gpt", "value": "(A) (0.696, 0.747)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/53dd68e48ef39253.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the black fabric backpack at center? Choose from: (A) white matte shirt at center (B) white matte jacket at lower center (C) black leather jacket at lower left" }, { "from": "gpt", "value": "(B) white matte jacket at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/30b75ff384f64b3c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green grass at center is positioned above green grass at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/145a9197223c44c2.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) metallic silver car at center (B) transparent glass door at center" }, { "from": "gpt", "value": "(A) metallic silver car at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/96100427b1183760.jpg", "conversations": [ { "from": "human", "value": "\nIs dark concrete skate park at center positioned at the back of dark blue jeans at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, dark concrete skate park at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b1b7c613fc21046.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) metallic tambourine at left (B) teal metallic guitar at right, is positioned closest to the smooth skin face at upper right?" }, { "from": "gpt", "value": "(B) teal metallic guitar at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/939bc65358d69af9.jpg", "conversations": [ { "from": "human", "value": "\nIs blue glossy fish at center to the right of matte brown rock at lower center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, blue glossy fish at center is not to the right of matte brown rock at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf6dd8fb4df7caae.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy hillside at upper left is wider than wooden cabin at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, green leafy hillside at upper left is wider than wooden cabin at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd6cb0e11dc2f1c9.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.459, 0.178) (B) (0.647, 0.550) (C) (0.977, 0.167)" }, { "from": "gpt", "value": "(A) (0.459, 0.178)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c16af8ea3fc5142b.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.155, 0.314) (B) (0.562, 0.317) (C) (0.328, 0.450)" }, { "from": "gpt", "value": "(B) (0.562, 0.317)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/004b42d9ce150b46.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of light brown hair at center in relation to light gray hoodie at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c6239241699f1bb4.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at right bigger than white smooth column at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, green leafy tree at right has a larger size compared to white smooth column at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/313c8046d46a8af8.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown fabric jacket at center appear over plastic water bottle at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, brown fabric jacket at center is located above plastic water bottle at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bfabe8fc21666821.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) matte black gloves at upper left (B) white fuzzy pants at center" }, { "from": "gpt", "value": "(A) matte black gloves at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6bd142a4db3598ab.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.459, 0.225) (B) (0.035, 0.295) (C) (0.376, 0.191)" }, { "from": "gpt", "value": "(C) (0.376, 0.191)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/65f3f1f2a2f3c37c.jpg", "conversations": [ { "from": "human", "value": "\nIs black fabric at right to the left of green fabric jacket at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, black fabric at right is to the right of green fabric jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5ef66e8528ed45eb.jpg", "conversations": [ { "from": "human", "value": "\nIs bronze statue at center bigger than bronze statue of child at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d90f53fee02d750f.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.233, 0.516) (B) (0.923, 0.417)" }, { "from": "gpt", "value": "(B) (0.923, 0.417)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd45fb3fa62a038b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown matte scarf at upper left is smaller than clear plastic glasses at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, brown matte scarf at upper left is not smaller than clear plastic glasses at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1f65e49a790c113.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the light green fabric baby at center? (A) camouflage fabric uniform at center (B) multicolored plastic toy at center" }, { "from": "gpt", "value": "(A) camouflage fabric uniform at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ffafd81f2e7ef687.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the shiny metallic ferris wheel at center? (A) white glossy boat at lower right (B) white glossy boat at center (C) white plastic boat at center" }, { "from": "gpt", "value": "(C) white plastic boat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dcebc77bd84a9038.jpg", "conversations": [ { "from": "human", "value": "\nDoes green canvas coach at upper left appear under brown leather horse at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, green canvas coach at upper left is below brown leather horse at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95e31a472239fec8.jpg", "conversations": [ { "from": "human", "value": "\nIs brown leather coat at center-right bigger than light gray fabric jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, brown leather coat at center-right is not larger than light gray fabric jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3afec73403a2cd74.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) gray soft fabric baby at center (B) white plastic remote at upper right" }, { "from": "gpt", "value": "(A) gray soft fabric baby at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/add00ee099644429.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) brown crumbly cake at center (B) plaid shirt at upper left" }, { "from": "gpt", "value": "(A) brown crumbly cake at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7cbc5d59e1dd54c.jpg", "conversations": [ { "from": "human", "value": "\nDoes silhouette jacket at right have a greater width compared to matte black cap at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c9e50a8b2def415.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) brown dirt path at lower right (B) green mossy bark at center" }, { "from": "gpt", "value": "(B) green mossy bark at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d3b299f4ffec03f7.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the black matte t-shirt at right? (A) matte black cap at left (B) shiny brown hair at center" }, { "from": "gpt", "value": "(B) shiny brown hair at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1bf4cebce9a5b616.jpg", "conversations": [ { "from": "human", "value": "\nIs white silky waterfall at center to the left of clear water at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white silky waterfall at center is not on the left side of clear water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/64c14ec6633ef985.jpg", "conversations": [ { "from": "human", "value": "\nIs green fleece hoodie at center below white jersey at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, green fleece hoodie at center is positioned under white jersey at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c0082ba80c9c1f48.jpg", "conversations": [ { "from": "human", "value": "\nIs matte gray suit at center thinner than metallic silver railing at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, matte gray suit at center's width is less than metallic silver railing at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4f428d53eb72088.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) light brown wooden guitar at center (B) black matte microphone at center (C) matte black guitar at center (D) velvet blue jacket at upper left" }, { "from": "gpt", "value": "(D) velvet blue jacket at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/944e252bafa7bd28.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) matte yellow sweater at upper left (B) matte black laptop at upper left (C) dark gray suit at upper right" }, { "from": "gpt", "value": "(C) dark gray suit at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d0b81dda58bb18c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white glossy figurine at center is positioned above matte white figure at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white glossy figurine at center is not above matte white figure at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/368e3caa9b0318cf.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown mud-brick village at center have a larger size compared to black fabric person at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2bb7926eda7339a4.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.690, 0.573) (B) (0.468, 0.516) (C) (0.742, 0.455) (D) (0.227, 0.519)" }, { "from": "gpt", "value": "(C) (0.742, 0.455)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9a17cc1a75d41494.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.206, 0.886) (B) (0.815, 0.838)" }, { "from": "gpt", "value": "(A) (0.206, 0.886)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7507c0a4a48c18b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown water at center is positioned to the left of matte glass skyscraper at center-left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, brown water at center is not to the left of matte glass skyscraper at center-left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e36ddb8f2e38ac21.jpg", "conversations": [ { "from": "human", "value": "\nIs dark blue suit at center below wooden table at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, dark blue suit at center is not below wooden table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/13036a60ff01e69c.jpg", "conversations": [ { "from": "human", "value": "\nIs gray sand at center below blue printed swimsuit at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ae0db0a494a8b031.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte white shirt at upper center is positioned to the right of bright red glossy teeth at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, matte white shirt at upper center is not to the right of bright red glossy teeth at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4b8607d88cd156f.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow and blue locomotive at center in front of gray gravel train track at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, yellow and blue locomotive at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/241b7112778baa6a.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.240, 0.880) (B) (0.535, 0.709) (C) (0.467, 0.803) (D) (0.644, 0.912)" }, { "from": "gpt", "value": "(A) (0.240, 0.880)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/80dee34b25d9f386.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if pink reflective goggles at upper center is positioned to the right of blue reflective lens goggles at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, pink reflective goggles at upper center is not on the right side of blue reflective lens goggles at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00705b9a8bc244c8.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark blue t-shirt at center is positioned to the right of purple cotton shirt at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, dark blue t-shirt at center is not to the right of purple cotton shirt at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ec02b5c0315fcd1.jpg", "conversations": [ { "from": "human", "value": "\nIs pink paper box at center to the left of iridescent glass necklace at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, pink paper box at center is not on the left side of iridescent glass necklace at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/80e47c65dd10e364.jpg", "conversations": [ { "from": "human", "value": "\nIs transparent glass balcony at center to the left of green textured tree at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, transparent glass balcony at center is not to the left of green textured tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0fb986294994ce71.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) brown dirt track at lower center (B) green leafy tree at left (C) matte black truck at center" }, { "from": "gpt", "value": "(B) green leafy tree at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/698262e941d68cf2.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.797, 0.589) (B) (0.263, 0.453) (C) (0.963, 0.898) (D) (0.113, 0.867)" }, { "from": "gpt", "value": "(B) (0.263, 0.453)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a9dcdae4819e4e00.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of matte black bus at center in relation to maroon metallic bus at right? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3e61654a69a15326.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black t-shirt at upper left appear under green fabric at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, matte black t-shirt at upper left is above green fabric at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d5de7a4ea07d6ab.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte plastic monitor at center have a smaller size compared to smooth blue shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, matte plastic monitor at center might be larger than smooth blue shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b147b9cb5c0041e4.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow matte/satin jumpsuit at center smaller than yellow matte arm at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, yellow matte/satin jumpsuit at center is not smaller than yellow matte arm at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/980f118d52dc22b0.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny brown cow at center in front of brown matte cow at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, shiny brown cow at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/65a411b053c6f6da.jpg", "conversations": [ { "from": "human", "value": "\nIs matte red flower at upper left positioned at the back of matte white flower at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4acbad00596f450a.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the matte khaki uniform at left? Choose among these: (A) kaki fabric uniform at center (B) yellow matte shirt at center" }, { "from": "gpt", "value": "(B) yellow matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/38f9e291dcdb02c6.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) blue fabric map at center (B) matte blue jacket at upper left (C) matte blue and red tracksuit at center (D) matte blue jacket at upper center" }, { "from": "gpt", "value": "(C) matte blue and red tracksuit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7273bfe81ea2b66f.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray wood cabin at center is positioned to the right of pink floral swimsuit at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, gray wood cabin at center is to the left of pink floral swimsuit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4c6409ee54bc4ac8.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.963, 0.984) (B) (0.390, 0.398) (C) (0.579, 0.719)" }, { "from": "gpt", "value": "(B) (0.390, 0.398)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9bb0948d7e0d3a46.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) smooth dark brown hair at center (B) matte purple dress at center (C) beige fabric dress at center (D) matte gold necklace at upper right" }, { "from": "gpt", "value": "(C) beige fabric dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff10c6850e298c16.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.300, 0.509) (B) (0.865, 0.669) (C) (0.860, 0.392)" }, { "from": "gpt", "value": "(B) (0.865, 0.669)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1fb1c0abccdf85e6.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black glasses at upper center below transparent plastic glasses at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, matte black glasses at upper center is positioned under transparent plastic glasses at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/965c2ca2cb88c5da.jpg", "conversations": [ { "from": "human", "value": "\nDoes green jersey at center lie behind black matte helmet at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is in front of black matte helmet at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe6deeb0f34ffba9.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the brown leafy tree at upper right? Select from: (A) green textured tree at upper center (B) green textured tree at upper left" }, { "from": "gpt", "value": "(B) green textured tree at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4c1ceb5ec416eba.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte projection screen at upper center further to camera compared to green dotted tie at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d3b4ec1ef1b53363.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.238, 0.673) (B) (0.010, 0.292)" }, { "from": "gpt", "value": "(B) (0.010, 0.292)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92521b7d602e3314.jpg", "conversations": [ { "from": "human", "value": "\nDoes black glossy blazer at center appear on the right side of matte gray dress at center left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, black glossy blazer at center is positioned on the right side of matte gray dress at center left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/35d3a5b2d41df5f6.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the white smooth shirt at center from the following options: (A) gray wool suit at right (B) checkered fabric robe at lower right?" }, { "from": "gpt", "value": "(B) checkered fabric robe at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed1d7143583de8a4.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) dark gray jacket at lower center (B) light gray fabric jacket at center" }, { "from": "gpt", "value": "(A) dark gray jacket at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f43647db6993af3e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) camouflage fabric pants at lower center (B) camouflage fabric uniform at left" }, { "from": "gpt", "value": "(A) camouflage fabric pants at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/19fa2d75ee5ef0e3.jpg", "conversations": [ { "from": "human", "value": "\nIs green algae water at left bigger than dark brown fur seal pup at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6db3108cb7970040.jpg", "conversations": [ { "from": "human", "value": "\nIs gray matte t-shirt at center to the left of blue jacket at upper right from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, gray matte t-shirt at center is to the left of blue jacket at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ce0b6b06e1d763c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the white matte running shoe at center? Select from: (A) white matte running shoe at left (B) white matte running shorts at left" }, { "from": "gpt", "value": "(B) white matte running shorts at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e49701627dc9755f.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.168, 0.531) (B) (0.693, 0.316) (C) (0.181, 0.783) (D) (0.270, 0.345)" }, { "from": "gpt", "value": "(A) (0.168, 0.531)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ddcd5eb7a131916.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) black matte penguin at lower right (B) translucent ice at upper center (C) black glossy penguin at left (D) black glossy penguin at center" }, { "from": "gpt", "value": "(B) translucent ice at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a9f1a07ec04e3b6d.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the polished dark wood altar at center? Choose from: (A) matte red lamp at center (B) brown polished wood stool at lower left (C) purple wood table at right" }, { "from": "gpt", "value": "(B) brown polished wood stool at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f3b560a2b9681b22.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) shiny black car at lower left (B) wooden bench at lower center" }, { "from": "gpt", "value": "(A) shiny black car at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/808c38c08530b64c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) red fabric flag at upper right (B) red velvet curtain at left" }, { "from": "gpt", "value": "(A) red fabric flag at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/67fbbb613734c43b.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the sheer white curtain at center? Choose from: (A) translucent plastic screen door at center (B) multicolored fabric beach chair at center" }, { "from": "gpt", "value": "(B) multicolored fabric beach chair at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8e943f5466ca456.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown dry grass at center come behind brown leafless tree at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, brown dry grass at center is in front of brown leafless tree at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0e956c27ca2fb66.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the dark blue jacket at center? Choose among these: (A) jeans at center (B) transparent plastic tower at center (C) black fabric at center (D) black leather jacket at center" }, { "from": "gpt", "value": "(D) black leather jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/19ac7f440699e751.jpg", "conversations": [ { "from": "human", "value": "\nDoes white printed shirt at lower left appear under white paper at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, white printed shirt at lower left is positioned under white paper at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b2663a23648f71a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.729, 0.342) (B) (0.084, 0.548)" }, { "from": "gpt", "value": "(B) (0.084, 0.548)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eeaee2910b124c7b.jpg", "conversations": [ { "from": "human", "value": "\nIs orange matte pumpkin at left wider than white soft baby at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, orange matte pumpkin at left is wider than white soft baby at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b12717e998c9377f.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.800, 0.761) (B) (0.125, 0.386)" }, { "from": "gpt", "value": "(B) (0.125, 0.386)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c8e5f62bf759e90.jpg", "conversations": [ { "from": "human", "value": "\nIs gray wool blazer at center below matte black suit at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, gray wool blazer at center is positioned under matte black suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dfa292e276468e84.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the yellow rubber tracked excavator at left among (A) yellow metallic tractor at center (B) dirt track at center?" }, { "from": "gpt", "value": "(B) dirt track at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b1947ef07d7848b.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown scaly lizard at center appear on the left side of gray rough rock at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, brown scaly lizard at center is positioned on the left side of gray rough rock at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe7f1a36cd284520.jpg", "conversations": [ { "from": "human", "value": "\nIs reddish-brown bark tree at center below green leafy tree at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba8e9909e86a22b9.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) matte purple shirt at center (B) lavender cotton shirt at left" }, { "from": "gpt", "value": "(A) matte purple shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36d27f7aaa13a7b4.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black bird at center have a larger size compared to fluffy black duckling at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, matte black bird at center is bigger than fluffy black duckling at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd2b94c0c405a27a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.073, 0.350) (B) (0.758, 0.555) (C) (0.598, 0.466)" }, { "from": "gpt", "value": "(C) (0.598, 0.466)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c82e49732568659c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) white glossy minivan at center (B) satin silver sedan at left" }, { "from": "gpt", "value": "(B) satin silver sedan at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/364d2a2fd2637d13.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if light blue shirt at center is positioned below yellow and black plastic microphone at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, light blue shirt at center is located below yellow and black plastic microphone at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cffd48b5806ef1bc.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if polished stone dome at center is bigger than white metallic cross at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, polished stone dome at center is bigger than white metallic cross at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/acbb0c553254a6d0.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark stone archway at center have a lesser width compared to wooden gate at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, dark stone archway at center's width is less than wooden gate at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/abb9345c10740fcf.jpg", "conversations": [ { "from": "human", "value": "\nIs greenish-gray water at lower center positioned in front of white metal bridge at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/075fbd181d770256.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.570, 0.247) (B) (0.497, 0.333)" }, { "from": "gpt", "value": "(A) (0.570, 0.247)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc2d87dfb9802318.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the rubberized plastic toy at lower center? (A) smooth skin hand at center (B) knitted fabric hand at center (C) wooden table at center" }, { "from": "gpt", "value": "(A) smooth skin hand at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2698afe67adc8011.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the blue fabric figure at center? (A) yellowmaterial/textureflag at lower center (B) orange fabric flag at center (C) blue matte figure at center (D) red jacket at upper center" }, { "from": "gpt", "value": "(B) orange fabric flag at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05fce36cb7e0383e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.020, 0.980) (B) (0.381, 0.475)" }, { "from": "gpt", "value": "(B) (0.381, 0.475)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b2295367456ed45.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) metallic silver rail at center (B) reflective green vest at center (C) neon yellow reflective uniform at center" }, { "from": "gpt", "value": "(A) metallic silver rail at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8c908d2dccd0713.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.417, 0.322) (B) (0.641, 0.608)" }, { "from": "gpt", "value": "(A) (0.417, 0.322)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b72028ef52f13f9.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.348, 0.639) (B) (0.624, 0.569) (C) (0.216, 0.752)" }, { "from": "gpt", "value": "(B) (0.624, 0.569)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/13d0625116c636f2.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) matte black jacket at center (B) black leather boot at lower center" }, { "from": "gpt", "value": "(A) matte black jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c2358d1fc5c1ce08.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.229, 0.633) (B) (0.145, 0.514) (C) (0.785, 0.434) (D) (0.862, 0.616)" }, { "from": "gpt", "value": "(B) (0.145, 0.514)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/45a9be268c96a0d8.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is matte yellow t-shirt at center located relative to concrete sidewalk at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b231b74cf32fc3e5.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue water at center is smaller than green smooth water at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9307f13113a66f18.jpg", "conversations": [ { "from": "human", "value": "\nIs rustic stone ruins at center further to camera compared to bare branches at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7633d0788944d512.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.726, 0.619) (B) (0.998, 0.316) (C) (0.470, 0.277) (D) (0.546, 0.002)" }, { "from": "gpt", "value": "(D) (0.546, 0.002)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3355ba4a5533400b.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of matte orange shirt at upper center in relation to black fabric shoulder bag at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/672eca8533f83ce0.jpg", "conversations": [ { "from": "human", "value": "\nDoes white striped shirt at left appear under light blue button-down shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff71701670ab590a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at center is wider than dirt/gravel road at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, green leafy tree at center might be narrower than dirt/gravel road at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/47360eeef1907a13.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green hedge at center is wider than green leafy tree at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df791fdc6f240819.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) green mossy log at center (B) green mossy tree at upper center" }, { "from": "gpt", "value": "(B) green mossy tree at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a94f6aa4c292f724.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) silver metallic laptop at lower center (B) white soft bed at center (C) pink fabric at left (D) pink fluffy toy at lower right" }, { "from": "gpt", "value": "(C) pink fabric at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f20a8190eed8e8ff.jpg", "conversations": [ { "from": "human", "value": "\nDoes translucent glass jar at center appear on the left side of black leather jacket at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, translucent glass jar at center is not on the left side of black leather jacket at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d78cd64b8ad2ed21.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of brown speckled duckling at left and brown speckled duckling at center in the image provided, where is brown speckled duckling at left located with respect to brown speckled duckling at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b59ce865d2817d5b.jpg", "conversations": [ { "from": "human", "value": "\nIs silver metallic minivan at center wider than shiny black sedan at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, silver metallic minivan at center might be narrower than shiny black sedan at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b47ec872905aa66c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if clear glass shards at center is positioned to the right of shiny black van at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, clear glass shards at center is not to the right of shiny black van at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c0c634e14a3b14de.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the teal t-shirt at center? Choose among these: (A) white paper at lower center (B) blue fabric table at center (C) teal matte shirt at center (D) green paper map at upper right" }, { "from": "gpt", "value": "(C) teal matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b10087fdaab73b0c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.977, 0.830) (B) (0.556, 0.383) (C) (0.542, 0.784) (D) (0.058, 0.681)" }, { "from": "gpt", "value": "(B) (0.556, 0.383)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4151760cf9c4d384.jpg", "conversations": [ { "from": "human", "value": "\nDoes white metal balcony at upper right come behind green leafy tree at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7379eab7ff6412d2.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) light blue striped shirt at center (B) white fabric beach chair at center (C) beige sand at lower center (D) orange fabric shirt at left" }, { "from": "gpt", "value": "(D) orange fabric shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a3c0486f55f047d0.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) dark brown curly hair at upper left (B) blue matte shirt at center" }, { "from": "gpt", "value": "(B) blue matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc83eaf165a03752.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the camo fabric shirt at center from the following options: (A) black matte tank top at center (B) black velvet shirt at center?" }, { "from": "gpt", "value": "(A) black matte tank top at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e38a5cd18be747e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the white matte shirt at lower right? Select from: (A) green woven cloth at left (B) multicolored fabric crowd at upper center" }, { "from": "gpt", "value": "(A) green woven cloth at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05b6388dcd0a2006.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny gold roof at center positioned behind dark gray stone people at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is in front of dark gray stone people at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/69dfe4e5e29e6911.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if concrete barrier at lower center is wider than matte black sunglasses at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, concrete barrier at lower center is wider than matte black sunglasses at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85b1d82e80ad0740.jpg", "conversations": [ { "from": "human", "value": "\nIs snowy granite mountain at upper center smaller than light gray backpack at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, snowy granite mountain at upper center might be larger than light gray backpack at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/adf323cb4ff699b7.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of black leather steering wheel at center in relation to black matte steering wheel at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36a550818fed51a9.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is glossy wood statue at center located relative to blue porcelain vase at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/712ce7842f73f125.jpg", "conversations": [ { "from": "human", "value": "\nIs whiteboard at upper center smaller than leather jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, whiteboard at upper center has a smaller size compared to leather jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2dd0edf1e2702eb6.jpg", "conversations": [ { "from": "human", "value": "\nIs brown plush armchair at right below fluffy beige pillow at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, brown plush armchair at right is located below fluffy beige pillow at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be294b82878251f8.jpg", "conversations": [ { "from": "human", "value": "\nDoes beige stone pavement at center appear on the left side of gray rock at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, beige stone pavement at center is to the right of gray rock at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b621edcec1fb6d06.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) wooden park bench at lower right (B) black wrought iron bench at lower right" }, { "from": "gpt", "value": "(A) wooden park bench at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/90d05781021a26c8.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark brown wood carving at center is positioned to the right of brown carved figure at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, dark brown wood carving at center is not on the right side of brown carved figure at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5470775f1847ed4.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.369, 0.664) (B) (0.648, 0.853) (C) (0.404, 0.695)" }, { "from": "gpt", "value": "(B) (0.648, 0.853)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/122cfab35c8bb7aa.jpg", "conversations": [ { "from": "human", "value": "\nDoes black matte coat at left lie in front of clear glass vase at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df630da4a26cb898.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if wooden at center is positioned to the right of brown wooden door at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, wooden at center is not on the right side of brown wooden door at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/150aaba251d05914.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black matte sweater at center is positioned below black turtleneck sweater at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, black matte sweater at center is above black turtleneck sweater at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f23c4349aeb784c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte gray table at center is wider than floral fabric cushion at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, the width of matte gray table at center exceeds that of floral fabric cushion at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/182cf0c1df598200.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue matte sweater at left have a greater width compared to multicolored pixelated hoodie at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, blue matte sweater at left is wider than multicolored pixelated hoodie at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d98b059d247f3a08.jpg", "conversations": [ { "from": "human", "value": "\nIs pink fabric at center to the left of white soft pillow at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, pink fabric at center is to the left of white soft pillow at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b9d24b61029adcc.jpg", "conversations": [ { "from": "human", "value": "\nIs green denim jacket at center behind orange matte pumpkin at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is behind orange matte pumpkin at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de813a515dd417e0.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) transparent water at center (B) blue matte cargo ship at center" }, { "from": "gpt", "value": "(A) transparent water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/42d0201d1327fd08.jpg", "conversations": [ { "from": "human", "value": "\nIs camouflage uniform at center thinner than matte black helmet at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c7de8c0a68d25b5.jpg", "conversations": [ { "from": "human", "value": "\nWhere is white matte table at upper center located in relation to black glossy table at upper right in the image? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/691c03af2f78c813.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.896, 0.342) (B) (0.791, 0.087)" }, { "from": "gpt", "value": "(B) (0.791, 0.087)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37e198cb7c46709c.jpg", "conversations": [ { "from": "human", "value": "\nDoes dry grass hut at center have a lesser width compared to green leafy palm tree at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, dry grass hut at center has a lesser width compared to green leafy palm tree at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc065703925f9feb.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) green rocky mountain at upper right (B) green leafy tree at left (C) green rocky mountain at upper left (D) snowy rock mountain at center" }, { "from": "gpt", "value": "(B) green leafy tree at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e61833944dab6856.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.087, 0.575) (B) (0.986, 0.858) (C) (0.895, 0.720) (D) (0.479, 0.580)" }, { "from": "gpt", "value": "(D) (0.479, 0.580)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1fe960365e477f1.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of brown rocky mountain at upper center in reference to brown corrugated metal houses at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0462e7d07045146f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.265, 0.872) (B) (0.842, 0.256) (C) (0.383, 0.787) (D) (0.641, 0.272)" }, { "from": "gpt", "value": "(A) (0.265, 0.872)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/350c4c2fc48be4f5.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) white shirt at upper center (B) blue cotton shirt at center" }, { "from": "gpt", "value": "(A) white shirt at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/17ede399ef601fa4.jpg", "conversations": [ { "from": "human", "value": "\nDoes silhouette fabric couple at center lie in front of gray fabric tank top at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, silhouette fabric couple at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d824345e468df1f5.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.201, 0.836) (B) (0.745, 0.642)" }, { "from": "gpt", "value": "(A) (0.201, 0.836)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/98266c970ff94c08.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of light beige fabric at center in relation to light brown hair at center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f18e66f1b4876e02.jpg", "conversations": [ { "from": "human", "value": "\nIs dark brown leather jacket at center smaller than smooth white shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, dark brown leather jacket at center is smaller than smooth white shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/98a0795e7c6e430c.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte tank top at center thinner than matte red tank top at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, white matte tank top at center has a lesser width compared to matte red tank top at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a3e3ddc7f20c085.jpg", "conversations": [ { "from": "human", "value": "\nDoes denim jacket at center have a larger size compared to dark gray jacket at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c541f893f73f4c62.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the matte brown shirt at center? Choose from: (A) brown matte pot at lower left (B) striped cotton shirt at center (C) brown crispy chicken at center" }, { "from": "gpt", "value": "(B) striped cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a64c76432fa5da00.jpg", "conversations": [ { "from": "human", "value": "\nDoes snowy rock mountain at upper center come in front of matte gray minivan at right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, snowy rock mountain at upper center is behind matte gray minivan at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe72cdf5ecf51cd8.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.604, 0.723) (B) (0.621, 0.559)" }, { "from": "gpt", "value": "(B) (0.621, 0.559)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a92f825644c8b76.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) white soft robe at center (B) white soft robe at lower center (C) dark gray fabric shirt at center (D) matte white robe at center" }, { "from": "gpt", "value": "(B) white soft robe at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/93ed6b696e95f88a.jpg", "conversations": [ { "from": "human", "value": "\nDoes greenish water at center appear over metallic red boat at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, greenish water at center is not above metallic red boat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46704307c028323e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) metallic silver golf club at center (B) shiny silver golf ball at center (C) green grass at center" }, { "from": "gpt", "value": "(C) green grass at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7907e2dd2ec6502b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white canvas bag at center is thinner than brown silky hair at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, white canvas bag at center is not thinner than brown silky hair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/17014d31e4c153da.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.324, 0.480) (B) (0.334, 0.558)" }, { "from": "gpt", "value": "(B) (0.334, 0.558)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7182f37cd75675e5.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) black floral blouse at upper right (B) pink checkered shirt at left" }, { "from": "gpt", "value": "(B) pink checkered shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5f77cab80361a978.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) blue metallic bus at center (B) bare branches at upper center (C) green leafy tree at left" }, { "from": "gpt", "value": "(C) green leafy tree at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba1fcaf8f52c5592.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if wooden wagon at center is smaller than translucent plastic toy at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, wooden wagon at center is not smaller than translucent plastic toy at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c6942c8aa585dfeb.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.430, 0.447) (B) (0.660, 0.758)" }, { "from": "gpt", "value": "(B) (0.660, 0.758)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba53373cfb0574e7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if shiny metallic dress at center is wider than shiny pink dress at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, shiny metallic dress at center has a greater width compared to shiny pink dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8c144e7bd362970.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at center smaller than metallic gray pole at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, green leafy tree at center might be larger than metallic gray pole at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/41d7393bf4cb49ff.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.639, 0.141) (B) (0.114, 0.991)" }, { "from": "gpt", "value": "(A) (0.639, 0.141)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7a3eb6d0a3454c8.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if translucent plastic wrapped food at center is positioned to the left of shiny brown meat at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, translucent plastic wrapped food at center is positioned on the left side of shiny brown meat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/43d572f459d1214e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.666, 0.364) (B) (0.296, 0.053)" }, { "from": "gpt", "value": "(A) (0.666, 0.364)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05eeee9fdbac8bce.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) golden crusty bread at upper left (B) green crisp cucumber at center" }, { "from": "gpt", "value": "(B) green crisp cucumber at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fa0765645ef17536.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown fluffy duckling at center appear on the right side of brown fluffy duckling at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find brown fluffy duckling at center to the right of brown fluffy duckling at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/33c76495f9d890ec.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) shiny black suit at center (B) black satin vest at center (C) black jersey at center (D) white leather jacket at center" }, { "from": "gpt", "value": "(A) shiny black suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/661295554b146a8a.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) dark reflective water at lower center (B) dark gray stone tower at center-left (C) dark gray stone church at upper left, is positioned farthest from the scaffolding wood tower at left?" }, { "from": "gpt", "value": "(A) dark reflective water at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/065440a7bd48dc56.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue paper at center appear on the right side of blue matte book at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, blue paper at center is not on the right side of blue matte book at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77fb857c38188adb.jpg", "conversations": [ { "from": "human", "value": "\nDoes orange fabric astronaut suit at center appear on the left side of brown fuzzy costume at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, orange fabric astronaut suit at center is not to the left of brown fuzzy costume at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1bdf0ff0890e226.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.538, 0.894) (B) (0.362, 0.520) (C) (0.263, 0.411)" }, { "from": "gpt", "value": "(C) (0.263, 0.411)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f148053b3e37826.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) white fabric lampshade at right (B) clear crystal chandelier at upper center (C) wooden display case at center (D) velvet-patterned armchair at right" }, { "from": "gpt", "value": "(A) white fabric lampshade at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04fa45ca99c1beec.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of matte red truck at center in reference to clear glass window at center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5647439875f1f474.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass at center further to the viewer compared to floral-patterned fabric dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4b652cc6ddb6e3c.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the blue knit sweater at center? (A) gray hair at lower right (B) matte black microphone at center (C) black matte microphone at center (D) black matte shirt at upper right" }, { "from": "gpt", "value": "(D) black matte shirt at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e3030f80233c1b59.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white plastic window at center is positioned above white glossy window at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/57ecada67eb547f5.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of transparent glass window at left in relation to blue textured vent at right? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c86732b82e30d82.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.572, 0.398) (B) (0.617, 0.411)" }, { "from": "gpt", "value": "(B) (0.617, 0.411)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e53ddd5813d448d8.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) white matte snow at center (B) metallic gray engine at left" }, { "from": "gpt", "value": "(B) metallic gray engine at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7a86fea8a2754972.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.851, 0.703) (B) (0.741, 0.508)" }, { "from": "gpt", "value": "(B) (0.741, 0.508)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7cf7b5a2ea133c7.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.920, 0.820) (B) (0.522, 0.672) (C) (0.259, 0.602)" }, { "from": "gpt", "value": "(C) (0.259, 0.602)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/83dd5bfe0cdaca9e.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of white fabric at center in reference to brown feathered bird at left? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8ebd78fd582825dd.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.456, 0.675) (B) (0.489, 0.838)" }, { "from": "gpt", "value": "(A) (0.456, 0.675)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7cb66f201d2f501d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) striped cotton shirt at center (B) green plaid shorts at center" }, { "from": "gpt", "value": "(B) green plaid shorts at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df804600f9cc6822.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) dry wood vine at left (B) green leafy tree at center" }, { "from": "gpt", "value": "(B) green leafy tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5938a8cbc24576d2.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.843, 0.717) (B) (0.791, 0.175)" }, { "from": "gpt", "value": "(B) (0.791, 0.175)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/405f9fcc7133a94b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if snowy rocky mountain at center is wider than green matte tree at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9bae504798dfb835.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if smooth beige portrait at upper center is bigger than matte plastic portrait at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, smooth beige portrait at upper center has a larger size compared to matte plastic portrait at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7a2a8d72b3006605.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of green leafy tree at upper left and wooden dock at center in the image provided, where is green leafy tree at upper left located with respect to wooden dock at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b23abfd122b4572a.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) light brown wooden stick at lower left (B) clear water at center" }, { "from": "gpt", "value": "(A) light brown wooden stick at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73db64931a0eb692.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of green grassy at center in reference to brown wooden bench at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/24e95ad04aaee29e.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green leafy tree at center located in relation to yellow matte flower at lower center in the image? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f8cbed108426cbfa.jpg", "conversations": [ { "from": "human", "value": "\nIs white glossy swan at center bigger than silvery metallic bird at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, white glossy swan at center has a larger size compared to silvery metallic bird at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4824ddecb2b6a93.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.735, 0.622) (B) (0.724, 0.617) (C) (0.321, 0.845)" }, { "from": "gpt", "value": "(C) (0.321, 0.845)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e9bbd71f6bf73b67.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.369, 0.539) (B) (0.701, 0.345)" }, { "from": "gpt", "value": "(A) (0.369, 0.539)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b71ea2431a6aebd.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.471, 0.136) (B) (0.077, 0.106)" }, { "from": "gpt", "value": "(A) (0.471, 0.136)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c66218738a5f4d75.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.344, 0.908) (B) (0.552, 0.970)" }, { "from": "gpt", "value": "(B) (0.552, 0.970)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/75abab0702d629a1.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) white matte golf club at left (B) navy blue jersey at center" }, { "from": "gpt", "value": "(A) white matte golf club at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c04475810ae6ad8.jpg", "conversations": [ { "from": "human", "value": "\nDoes green grass at center appear under black glossy bull at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, green grass at center is below black glossy bull at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/12598a3c61743f4d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) matte black cube at center (B) orange glossy bird at center (C) purple glossy triangle at center" }, { "from": "gpt", "value": "(B) orange glossy bird at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d38bbbf930fa4dff.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if yellow leather jacket at center is smaller than jeans at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, yellow leather jacket at center occupies less space than jeans at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4ae34c58805ce9e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) blue fabric shirt at upper right (B) black plastic microphone at upper right (C) black plastic microphone at center" }, { "from": "gpt", "value": "(B) black plastic microphone at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/52270942513f64a0.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at upper center is wider than metallic silver pole at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, green leafy tree at upper center is wider than metallic silver pole at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/32b79d90568ba8ec.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the striped cotton shirt at center? Choose among these: (A) matte black backpack at left (B) smooth concrete tarmac at center" }, { "from": "gpt", "value": "(A) matte black backpack at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8ee2835275e0f6c.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of matte gray jacket at center in relation to flaming wood at lower left? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/afed1fffad338048.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the brown matte bird at center? Choose from: (A) green leafy tree at upper right (B) gray textured tree trunk at center (C) brown textured tree trunk at upper center" }, { "from": "gpt", "value": "(B) gray textured tree trunk at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/10607e3b7ed2ac45.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black car at right is wider than silver metallic sedan at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, matte black car at right has a greater width compared to silver metallic sedan at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4c2cf460eee2c0bb.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the black plastic hanger at center among (A) matte black hanger at center (B) red checkered shirt at center (C) metallic silver hanger at center?" }, { "from": "gpt", "value": "(B) red checkered shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4d47fe6391d459e3.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the white smooth calf at center? Select from: (A) brown matte cow at center (B) green leafy tree at upper center" }, { "from": "gpt", "value": "(B) green leafy tree at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b36663d328f0766.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark blue fabric dress at center come in front of dark skin bald head at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is behind dark skin bald head at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f185a025c63d7a06.jpg", "conversations": [ { "from": "human", "value": "\nDoes gold polished dome at center lie in front of green metallic street sign at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d37049bc77496890.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.288, 0.058) (B) (0.939, 0.950)" }, { "from": "gpt", "value": "(A) (0.288, 0.058)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be2f4de3515d16f6.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green leafy tree at lower left located in relation to green leafy tree at upper left in the image? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a09ef603b490114.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if weathered stone hut at center is smaller than rusty metal roof at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, weathered stone hut at center is smaller than rusty metal roof at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b683a57fb53dcc87.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue fabric jacket at left is wider than white cotton shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of blue fabric jacket at left exceeds that of white cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d96c06cb4bc72aa.jpg", "conversations": [ { "from": "human", "value": "\nDoes printed fabric dress at center have a greater width compared to matte black sandal at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, printed fabric dress at center is wider than matte black sandal at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ffbaaf939f0fbfab.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.744, 0.434) (B) (0.434, 0.492)" }, { "from": "gpt", "value": "(B) (0.434, 0.492)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ebe9ca0656b15dfb.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.177, 0.689) (B) (0.159, 0.495) (C) (0.573, 0.569) (D) (0.479, 0.461)" }, { "from": "gpt", "value": "(C) (0.573, 0.569)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f471712008ebb67.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.904, 0.266) (B) (0.344, 0.927)" }, { "from": "gpt", "value": "(A) (0.904, 0.266)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed768f9715f23f07.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the pink cotton shirt at left? Choose among these: (A) black leather purse at center (B) white cotton t-shirt at center (C) striped hoodie at center (D) metal fence at center" }, { "from": "gpt", "value": "(B) white cotton t-shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/68836e255e2531d6.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is matte beige shirt at center located relative to matte black juggling pins at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9fe80af1bcad3ea8.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.832, 0.784) (B) (0.912, 0.597) (C) (0.514, 0.541)" }, { "from": "gpt", "value": "(B) (0.912, 0.597)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6cda0157e020a064.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dirt/gravel path at center is positioned below clear water at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, dirt/gravel path at center is above clear water at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4dbe27efdb049e12.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte canoe at center further to camera compared to yellow plastic paddle at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is in front of yellow plastic paddle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/80933640f29bf915.jpg", "conversations": [ { "from": "human", "value": "\nDoes concrete parking lot at center appear under matte khaki pants at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, concrete parking lot at center is not below matte khaki pants at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/429e9126f6222f15.jpg", "conversations": [ { "from": "human", "value": "\nIs orange printed leopard at center to the left of black leather glove at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, orange printed leopard at center is not on the left side of black leather glove at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e68c0824c2caca91.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) blue matte jacket at center (B) white matte helmet at upper center (C) white matte helmet at center" }, { "from": "gpt", "value": "(C) white matte helmet at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d635f3b435c32dce.jpg", "conversations": [ { "from": "human", "value": "\nDoes smooth concrete pavement at center lie behind matte white shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, smooth concrete pavement at center is in front of matte white shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46ab36cc09b3054a.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark gray suit at center lie in front of floral pants at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is in front of floral pants at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7cc30d6c0b1fc04.jpg", "conversations": [ { "from": "human", "value": "\nIs brown brick church at center further to camera compared to green leafy tree at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88c56da21f2e97d0.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) neon yellow reflective vest at center (B) glossy black helmet at center" }, { "from": "gpt", "value": "(A) neon yellow reflective vest at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df29e5e94dec0bf8.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the brown glossy horse at center? Choose from: (A) rusty metal wagon at center (B) purple cotton shirt at center (C) floral shirt at center" }, { "from": "gpt", "value": "(A) rusty metal wagon at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d5e4acbaee70215.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white matte door at center is positioned to the right of white wooden door at right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white matte door at center is not to the right of white wooden door at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02cdfbdc0968987d.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) concrete at center (B) green leafy palm tree at left" }, { "from": "gpt", "value": "(A) concrete at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bfbea064c9911bd8.jpg", "conversations": [ { "from": "human", "value": "\nIs silver metallic tower at center to the right of gray concrete building at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, silver metallic tower at center is to the left of gray concrete building at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/963a76c43256b05a.jpg", "conversations": [ { "from": "human", "value": "\nDoes red cotton shirt at center appear on the right side of red cotton polo shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find red cotton shirt at center to the right of red cotton polo shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a547275263559b5.jpg", "conversations": [ { "from": "human", "value": "\nIs blue fabric shirt at center positioned at the back of yellow cotton shirt at right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is in front of yellow cotton shirt at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/90559a2b60e0e23a.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is smooth skin hand at center located relative to blue plastic scissors at center-right? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/84a10cae2385b876.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.676, 0.870) (B) (0.523, 0.719)" }, { "from": "gpt", "value": "(B) (0.523, 0.719)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00272c8990ce05be.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) matte brown jacket at center (B) green paper chain at center" }, { "from": "gpt", "value": "(B) green paper chain at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b160b4bd61fb755.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of dark blue sweater at center and wooden table at center in the image provided, where is dark blue sweater at center located with respect to wooden table at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/35bbc31bd19d215b.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) smooth brown tree trunk at right (B) smooth gray bark tree at right, is positioned closest to the weathered wood at lower center?" }, { "from": "gpt", "value": "(A) smooth brown tree trunk at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c2b8f16d9493014.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black tank top at center above blue denim jeans at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, matte black tank top at center is not above blue denim jeans at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5eeb8a5b55c03433.jpg", "conversations": [ { "from": "human", "value": "\nIs orange matte fried snack at center to the right of coconut shell at left from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, orange matte fried snack at center is positioned on the right side of coconut shell at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/62b5d95f98dc0939.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) white cotton jacket at lower right (B) matte black car at left (C) dark gray coat at center right" }, { "from": "gpt", "value": "(C) dark gray coat at center right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cb259fecb983a561.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the white matte baseball hat at left from the following options: (A) black and white striped microphone at center (B) yellow matte shirt at left (C) white printed baseball cap at upper right (D) white matte hat at upper right?" }, { "from": "gpt", "value": "(B) yellow matte shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/008a0c001ea6cd48.jpg", "conversations": [ { "from": "human", "value": "\nIs white satin dress at center wider than satin purple dress at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white satin dress at center is not wider than satin purple dress at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/79275b45ba4e5f4b.jpg", "conversations": [ { "from": "human", "value": "\nDoes green matte shirt at center have a lesser width compared to black matte bicycle at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/55f934da04fb89a3.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) dark fabric pants at center (B) green mossy cave at center (C) dirt path at center" }, { "from": "gpt", "value": "(C) dirt path at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d59833cb3d62b5f.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.713, 0.511) (B) (0.321, 0.447)" }, { "from": "gpt", "value": "(B) (0.321, 0.447)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/572dba8c2eb71612.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.694, 0.436) (B) (0.999, 0.342)" }, { "from": "gpt", "value": "(B) (0.999, 0.342)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0974b7da309384f4.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte orange cap at center appear under green reflective lens at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, matte orange cap at center is not below green reflective lens at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d2fd7491607ffc16.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden bridge at upper center thinner than white matte baseball cap at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/499119fcd398a1b2.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) satin white bikini at center (B) matte black bikini at center" }, { "from": "gpt", "value": "(A) satin white bikini at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/897f086b3aca1eb7.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at center to the right of wooden gazebo at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find green leafy tree at center to the right of wooden gazebo at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8fc440b67bb3746a.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) green leafy tree at left (B) matte black headrest at center" }, { "from": "gpt", "value": "(B) matte black headrest at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/63b2cda888ddd096.jpg", "conversations": [ { "from": "human", "value": "\nIs black reflective sunglasses at center bigger than green plastic glasses at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88aeda1c301205fe.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.202, 0.417) (B) (0.125, 0.248) (C) (0.983, 0.497) (D) (0.734, 0.481)" }, { "from": "gpt", "value": "(B) (0.125, 0.248)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/18fec61d25a1f960.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.874, 0.316) (B) (0.007, 0.358)" }, { "from": "gpt", "value": "(B) (0.007, 0.358)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5be54a8db4bd05c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) weathered wood fence at center (B) brown speckled feathers at center, is positioned farthest from the green grass at lower center?" }, { "from": "gpt", "value": "(A) weathered wood fence at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7fc445941dcd38b.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of white matte skirt at center and white quilted leather boot at center in the image provided, where is white matte skirt at center located with respect to white quilted leather boot at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/da5c59c57b888126.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of dry skin at center in reference to yellow gauze at lower left? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a9fc5708c6e7e71.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.280, 0.491) (B) (0.763, 0.594) (C) (0.364, 0.423)" }, { "from": "gpt", "value": "(C) (0.364, 0.423)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c29506a2d712f635.jpg", "conversations": [ { "from": "human", "value": "\nIs pink fabric baseball cap at center wider than pink satin baseball hat at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, pink fabric baseball cap at center has a greater width compared to pink satin baseball hat at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dfd6283d8d32ed46.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the translucent glass cup at table center? Choose among these: (A) brown fabric baseball cap at center (B) yellow fabric cap at left (C) camo fabric shirt at center" }, { "from": "gpt", "value": "(A) brown fabric baseball cap at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a041066ec2439161.jpg", "conversations": [ { "from": "human", "value": "\nIs satin dress at center positioned in front of satin dress at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f252b6bb3198595.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte wetsuit at center wider than white glossy surfboard at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8477c7a3d1b70d15.jpg", "conversations": [ { "from": "human", "value": "\nIs green satin saree at center in front of black silk saree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, green satin saree at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c70eb46a271b0160.jpg", "conversations": [ { "from": "human", "value": "\nIs blue stone water at lower left below green copper dome at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, blue stone water at lower left is located below green copper dome at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/383c36ab0d36019c.jpg", "conversations": [ { "from": "human", "value": "\nDoes multicolored plastic chips at right have a lesser width compared to dark brown leather shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, multicolored plastic chips at right might be wider than dark brown leather shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95e6101fbf383934.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) floral fabric dress at center (B) floral print fabric dress at center (C) spiderman towel at upper left (D) black plastic goggles at upper center" }, { "from": "gpt", "value": "(D) black plastic goggles at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70220c58599b273a.jpg", "conversations": [ { "from": "human", "value": "\nIs light green cotton shirt at center thinner than black fabric bag at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, light green cotton shirt at center is thinner than black fabric bag at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e65d6d239e45734c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if shiny gray horse at left is positioned above white matte sheep at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, shiny gray horse at left is located above white matte sheep at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/403d9fa96561a169.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the sandy beach at lower left? Choose among these: (A) brown rough rock at center (B) smooth gray rock at center" }, { "from": "gpt", "value": "(A) brown rough rock at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb3f67aeb5687c83.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if bare wood tree at center is thinner than smooth gray steeple at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, bare wood tree at center is not thinner than smooth gray steeple at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6021a305dec819e6.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the red running shoe at center? (A) black matte shorts at center (B) gray fabric shirt at center" }, { "from": "gpt", "value": "(A) black matte shorts at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c0c4435cbded34b.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of white matte motorcycle at center in relation to matte black helmet at center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/398b4c0d9b39eb5f.jpg", "conversations": [ { "from": "human", "value": "\nIs concrete stairs at center bigger than black metal/rail at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, concrete stairs at center is larger in size than black metal/rail at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef276562d42fc107.jpg", "conversations": [ { "from": "human", "value": "\nDoes shiny orange race car at lower left appear on the right side of white glossy license plate at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, shiny orange race car at lower left is not to the right of white glossy license plate at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a29c67335bb722c4.jpg", "conversations": [ { "from": "human", "value": "\nWhere is satin pink doll at left located in relation to green glossy hair at center in the image? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4adf23b4eb3f2dae.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of dark brown fabric at lower center in relation to pink fabric at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9be59fef25eb44f6.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) dark blue jacket at right (B) green grass football field at center" }, { "from": "gpt", "value": "(B) green grass football field at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c101882195a0692d.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) shiny silver frame at center (B) shiny black frame at center" }, { "from": "gpt", "value": "(B) shiny black frame at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/093c73de093b1b25.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.454, 0.256) (B) (0.460, 0.853)" }, { "from": "gpt", "value": "(B) (0.460, 0.853)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0f1d6d0770e0ecb.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) dirt path at center (B) green leafy ferns at center (C) green leafy vegetation at center (D) green grassy hill at upper left" }, { "from": "gpt", "value": "(D) green grassy hill at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9418ab02ef5390e.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the black textured blazer at center? (A) striped fabric shirt at center (B) white t-shirt at center (C) brown matte sweater at center" }, { "from": "gpt", "value": "(A) striped fabric shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7d4ace24879c158.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of green matte jacket at center in relation to green matte sunglasses at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d73cd6c651c51725.jpg", "conversations": [ { "from": "human", "value": "\nWhere is navy blue dress at center located in relation to purple velvet pillow at lower left in the image? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01047579b8e4cbab.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) light brown wooden pole at upper center (B) maroon fabric monk at left (C) white matte vest at center (D) black cotton shirt at center" }, { "from": "gpt", "value": "(A) light brown wooden pole at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e97700ec7d4195e0.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the matte skin at center from the following options: (A) orange rubber dinghy at center (B) matte black shorts at center (C) red fabric life jacket at lower center (D) plaid shorts at center?" }, { "from": "gpt", "value": "(A) orange rubber dinghy at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4c3802a1bd3c842e.jpg", "conversations": [ { "from": "human", "value": "\nIs black leather jacket at upper right behind matte brown pastry at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, black leather jacket at upper right is behind matte brown pastry at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4606102cf0890e7e.jpg", "conversations": [ { "from": "human", "value": "\nIs silver metallic van at lower left smaller than black plastic traffic light at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/56404b1ce91a5dc0.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if printed fabric shirt at left is positioned to the right of transparent plastic container at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, printed fabric shirt at left is to the left of transparent plastic container at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/18954603cdf83172.jpg", "conversations": [ { "from": "human", "value": "\nIs metallic mesh fence at center in front of white fabric man at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is in front of white fabric man at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd484e8b2420809b.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.591, 0.895) (B) (0.151, 0.859)" }, { "from": "gpt", "value": "(B) (0.151, 0.859)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b4b0d9cfe4a7806.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) gold chain with pendant at center (B) bluematteeye at upper center (C) matte black goggles at center (D) brown braided hair at upper left" }, { "from": "gpt", "value": "(A) gold chain with pendant at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2195c21e70e69d8e.jpg", "conversations": [ { "from": "human", "value": "\nIs white plastic pole at center above white plastic lamp post at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e45b8fb6bb19af69.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.902, 0.736) (B) (0.120, 0.294) (C) (0.066, 0.633)" }, { "from": "gpt", "value": "(B) (0.120, 0.294)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f3b322dd6b96b1f.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.295, 0.453) (B) (0.210, 0.278)" }, { "from": "gpt", "value": "(A) (0.295, 0.453)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b9d6b9f5960df82.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown wooden train track at lower center is smaller than metallic wire mesh at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, brown wooden train track at lower center might be larger than metallic wire mesh at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ae319b4a0683d501.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the silver metallic ring at center? (A) black matte shirt at center (B) blue patterned shirt at center" }, { "from": "gpt", "value": "(B) blue patterned shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/905da1847b4d5ff5.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) brown wood carving at center (B) white wood railing at center" }, { "from": "gpt", "value": "(A) brown wood carving at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/047eedd5f17d8809.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) smooth fabric shirt at center (B) smooth concrete bench at lower center (C) smooth fabric sit at lower right" }, { "from": "gpt", "value": "(A) smooth fabric shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eef086a3ba85c22c.jpg", "conversations": [ { "from": "human", "value": "\nIs green grassy at center to the right of bark-white tree at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, green grassy at center is to the left of bark-white tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d6b0350f57a35b3.jpg", "conversations": [ { "from": "human", "value": "\nIs white fluffy cloud at center below brown matte chimney at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, white fluffy cloud at center is not positioned below brown matte chimney at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/968af31a275c6d0c.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth water at center behind red matte sailboat at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a33bdece303caa25.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at left is positioned to the left of white wooden porch at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find green leafy tree at left to the left of white wooden porch at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7bd79894b275c6f8.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.400, 0.241) (B) (0.311, 0.186)" }, { "from": "gpt", "value": "(B) (0.311, 0.186)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a94da24fbafce78.jpg", "conversations": [ { "from": "human", "value": "\nIs orange printed fabric at center thinner than shiny black skin at right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, orange printed fabric at center is not thinner than shiny black skin at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ddeecb67e78ec2aa.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.993, 0.959) (B) (0.934, 0.991) (C) (0.456, 0.873)" }, { "from": "gpt", "value": "(B) (0.934, 0.991)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/000ba28d70b1a999.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) leather sandal at lower center (B) red plaid scarf at upper center" }, { "from": "gpt", "value": "(A) leather sandal at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1cafb557f49a81a8.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.540, 0.902) (B) (0.019, 0.963)" }, { "from": "gpt", "value": "(B) (0.019, 0.963)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95aea49d384cb7eb.jpg", "conversations": [ { "from": "human", "value": "\nDoes green fabric bag at lower left appear over golden brown baguette at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, green fabric bag at lower left is above golden brown baguette at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4d16535aa09fca9.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of white satin dress at left in reference to matte purple hat at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23a8a1788228ae88.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy bush at upper center is positioned to the left of green leafy tree at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, green leafy bush at upper center is to the right of green leafy tree at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/facca0405d8b3717.jpg", "conversations": [ { "from": "human", "value": "\nDoes white glossy pillar at left have a greater width compared to striped fabric stool at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a204cf798dc613f.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at center thinner than shiny black dog at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/025684ed53f3670c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark gray suit at center is smaller than matte black suit at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, dark gray suit at center occupies less space than matte black suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/359f0419a8922cfe.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the blue fabric shirt at center among (A) gray fabric dress at center (B) blue water at center?" }, { "from": "gpt", "value": "(A) gray fabric dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ade1a57e5bf74a0.jpg", "conversations": [ { "from": "human", "value": "\nIs brown textured stone at center positioned at the back of brown leather boot at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, brown textured stone at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d262c966f9513d7.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) purple fabric shirt at left (B) green fleece hoodie at center (C) matte red sweater at lower right (D) light pink fleece at center" }, { "from": "gpt", "value": "(C) matte red sweater at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b3561bd671ebcd85.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) white glossy truck at center (B) white matte trailer truck at center" }, { "from": "gpt", "value": "(A) white glossy truck at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4677fc0a35d2d378.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.570, 0.827) (B) (0.428, 0.466) (C) (0.150, 0.630) (D) (0.503, 0.455)" }, { "from": "gpt", "value": "(D) (0.503, 0.455)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3e1e10fdd921eb6c.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the white glossy bus at center? Choose from: (A) shiny black sedan at left (B) silver metallic car at center" }, { "from": "gpt", "value": "(A) shiny black sedan at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2bb54c3c58434740.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.689, 0.713) (B) (0.453, 0.519) (C) (0.314, 0.667)" }, { "from": "gpt", "value": "(B) (0.453, 0.519)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0665f80262c7b81f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.738, 0.688) (B) (0.090, 0.759)" }, { "from": "gpt", "value": "(A) (0.738, 0.688)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b4d7f1e32823a76.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte gray t-shirt at center is smaller than black matte sunglasses at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, matte gray t-shirt at center might be larger than black matte sunglasses at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d27ec8b6569d443.jpg", "conversations": [ { "from": "human", "value": "\nIs gravelly asphalt driveway at center smaller than metal chain-link fence at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, gravelly asphalt driveway at center is smaller than metal chain-link fence at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/985c572d3faa3dca.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the shiny red tomatoes at center? (A) orange glossy oranges at right (B) shiny red onion at left (C) ripe red tomatoes at center (D) shiny plastic crates at center" }, { "from": "gpt", "value": "(B) shiny red onion at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88863fe294f4eaec.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) black matte microphone at center (B) maroon knit sweater at left" }, { "from": "gpt", "value": "(B) maroon knit sweater at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ad6994947414057d.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the fuzzy brown coat at left? Choose from: (A) matte gray suit at center (B) matte blue dress at center" }, { "from": "gpt", "value": "(A) matte gray suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/11b10f0db86063e0.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of green leafy tree at upper center and yellowish rock at center in the image provided, where is green leafy tree at upper center located with respect to yellowish rock at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b00baab3fb4c54e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) white cotton shirt at center (B) blue fabric backpack at upper right" }, { "from": "gpt", "value": "(B) blue fabric backpack at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0449e2c545fb8797.jpg", "conversations": [ { "from": "human", "value": "\nIs white soft fabric baby at center to the right of dark brown fuzzy hair at upper left from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find white soft fabric baby at center to the right of dark brown fuzzy hair at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/443ecd71681d9b60.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.374, 0.305) (B) (0.428, 0.373)" }, { "from": "gpt", "value": "(B) (0.428, 0.373)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c96f324cc4452b2.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue fabric flag at center is bigger than white matte flag at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, blue fabric flag at center has a larger size compared to white matte flag at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5172d929b8d14ae3.jpg", "conversations": [ { "from": "human", "value": "\nIs blue striped shirt at center positioned before dark blue suit at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/694bbd12e567b7ec.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray checkered shirt at lower right is thinner than printed cotton t-shirt at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, gray checkered shirt at lower right's width is less than printed cotton t-shirt at lower left's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/823bc110caa3630e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.164, 0.664) (B) (0.443, 0.591) (C) (0.445, 0.994) (D) (0.388, 0.661)" }, { "from": "gpt", "value": "(A) (0.164, 0.664)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8878fbc9cb5b78e.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.504, 0.383) (B) (0.547, 0.716) (C) (0.498, 0.491)" }, { "from": "gpt", "value": "(A) (0.504, 0.383)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/843c11bbe05667a3.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark fabric crowd at lower center lie in front of metallic silver microphone at center-right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5defbd3b7eb1d147.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.067, 0.759) (B) (0.563, 0.505)" }, { "from": "gpt", "value": "(A) (0.067, 0.759)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff7088b464530718.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) matte black hand at center (B) smooth skin hand at center" }, { "from": "gpt", "value": "(A) matte black hand at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d8436af8b71e3542.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) tan fabric bag at center (B) metallic silver monitor at center" }, { "from": "gpt", "value": "(A) tan fabric bag at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec56b64cb7f5a026.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) green matte tank top at center (B) metallic umbrella at upper left" }, { "from": "gpt", "value": "(B) metallic umbrella at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fa64cf80c6c321bf.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) blue matte shirt at center (B) black t-shirt at center (C) denim fabric chair at center (D) black cotton shirt at center" }, { "from": "gpt", "value": "(B) black t-shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/178b234e8e546adf.jpg", "conversations": [ { "from": "human", "value": "\nIs black fabric table at center smaller than denim shirt at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, black fabric table at center might be larger than denim shirt at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e58f3fb751da78c1.jpg", "conversations": [ { "from": "human", "value": "\nDoes white striped shirt at center come behind matte white shirt at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is in front of matte white shirt at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0783c0299b12fca.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black t-shirt at left below dark blue t-shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte black t-shirt at left is below dark blue t-shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ea41b2755a4e36d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.709, 0.817) (B) (0.451, 0.573)" }, { "from": "gpt", "value": "(B) (0.451, 0.573)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6c7b4adb0e9d84e.jpg", "conversations": [ { "from": "human", "value": "\nDoes shiny silver armor at center have a greater width compared to silver metallic armor at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5674c6a4fb7aad16.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue striped shirt at center is positioned to the left of black fabric jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, blue striped shirt at center is positioned on the left side of black fabric jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c3702d657cd897b5.jpg", "conversations": [ { "from": "human", "value": "\nDoes rugged stone mountain at upper center have a greater width compared to matte black bicycle at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, rugged stone mountain at upper center has a greater width compared to matte black bicycle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8de825886d605960.jpg", "conversations": [ { "from": "human", "value": "\nWhere is concrete sidewalk at center located in relation to silver metallic hatchback at lower left in the image? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1835189ee36ee5ae.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.996, 0.656) (B) (0.914, 0.792)" }, { "from": "gpt", "value": "(A) (0.996, 0.656)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0265bcbac397301.jpg", "conversations": [ { "from": "human", "value": "\nIs white fur cat at upper left bigger than matte cardboard box at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, white fur cat at upper left is larger in size than matte cardboard box at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4950c872d6978478.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte gray tank top at center is positioned to the left of matte white tank top at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, matte gray tank top at center is to the right of matte white tank top at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/830cfd71c8e082ee.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.903, 0.583) (B) (0.708, 0.758) (C) (0.315, 0.881) (D) (0.525, 0.761)" }, { "from": "gpt", "value": "(D) (0.525, 0.761)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d0d44c65cf1168a.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) matte blue jacket at center (B) shiny red toy car at center" }, { "from": "gpt", "value": "(A) matte blue jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/150561ae61d102dd.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) black hoodie at center (B) matte black camera at center" }, { "from": "gpt", "value": "(A) black hoodie at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86c349af515af6a5.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is navy blue fabric us navy shirt at center located relative to navy blue uniform at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/535250b8bce23ea8.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the silver metallic tripod at center among (A) pink fabric shirt at center (B) blue denim jeans at center (C) matte gray shirt at left?" }, { "from": "gpt", "value": "(C) matte gray shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5739c177d63e188.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte house at center appear over white matte wall at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, white matte house at center is positioned over white matte wall at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d90e88fc0284872d.jpg", "conversations": [ { "from": "human", "value": "\nDoes white glossy bath at lower center have a smaller size compared to chrome metallic shower head at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, white glossy bath at lower center is not smaller in size than chrome metallic shower head at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca21949fd73c6bbd.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.447, 0.917) (B) (0.192, 0.633) (C) (0.287, 0.373)" }, { "from": "gpt", "value": "(B) (0.192, 0.633)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/179bf19f93958118.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray stone gravestone at center appear under speckled stone gravestone at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, gray stone gravestone at center is above speckled stone gravestone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fa2ef636c17212e3.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the matte black bowl at upper center? (A) matte black bowl at center (B) white glossy teeth at upper center" }, { "from": "gpt", "value": "(B) white glossy teeth at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c09ebd52b4d1c25.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the dark textured shirt at center? (A) smooth skin figure at center (B) smooth black mask at center" }, { "from": "gpt", "value": "(B) smooth black mask at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2b8741bf46dae1e.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the blonde hair boy at center? Choose from: (A) black fabric flag at left (B) metallic car trunk at center (C) red fabric cap at center" }, { "from": "gpt", "value": "(C) red fabric cap at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc56bdbda0fb3f67.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the maroon sweater at center? Choose among these: (A) light gray shirt at center (B) brown glossy horse at center (C) gray cotton shirt at right (D) brown woolen jacket at center" }, { "from": "gpt", "value": "(D) brown woolen jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/50221cd74483216b.jpg", "conversations": [ { "from": "human", "value": "\nDoes jeans at upper left appear on the left side of white pants at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, jeans at upper left is positioned on the left side of white pants at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5172d929b8d14ae3.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if printed fabric blouse at center is positioned above blue paperboard at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f19b756b1a1cb73.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) cracked porcelain sink at lower center (B) cracked porcelain sink at center (C) white textured radiator at center (D) white plastic towel bar at upper center" }, { "from": "gpt", "value": "(D) white plastic towel bar at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e45c903c149d345.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of brown wooden door at center more distant than that of white glossy table at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4686fadc7273972.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) translucent plastic jar at center (B) translucent glass jar at center (C) matte black comb at upper left" }, { "from": "gpt", "value": "(B) translucent glass jar at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd5ff2451826185f.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the denim jeans at left? (A) dark blue jeans at center (B) matte black face at center (C) blue plastic license plate at center" }, { "from": "gpt", "value": "(A) dark blue jeans at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/651bd9f680eb0afe.jpg", "conversations": [ { "from": "human", "value": "\nIs orange plastic traffic cone at lower left positioned behind orange reflective cone at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, orange plastic traffic cone at lower left is behind orange reflective cone at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e1f21534677c8b8.jpg", "conversations": [ { "from": "human", "value": "\nDoes white fluffy cloud at upper center appear under green leafy tree at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, white fluffy cloud at upper center is positioned under green leafy tree at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d017f620dc2925be.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black matte laptop at center is bigger than black plastic microphone at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9227b5a7bc59696a.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.471, 0.661) (B) (0.373, 0.905)" }, { "from": "gpt", "value": "(A) (0.471, 0.661)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c619382624357a08.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.701, 0.419) (B) (0.910, 0.880)" }, { "from": "gpt", "value": "(A) (0.701, 0.419)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e5c8c09f49475b7c.jpg", "conversations": [ { "from": "human", "value": "\nDoes bronze statue at center come behind yellow fabric flag at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, bronze statue at center is behind yellow fabric flag at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ebf414cc469808b.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the leather jacket at upper center? Choose among these: (A) black cotton shirt at center (B) dark blue shirt at upper center" }, { "from": "gpt", "value": "(A) black cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ab1c6151f3b0fa9.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) gray rock mountain at center (B) green leafy tree at lower center (C) green textured pine trees at center" }, { "from": "gpt", "value": "(A) gray rock mountain at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1461eb3a7db10f2.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the brown woolen sweater at right? (A) framed paper at upper left (B) black matte t-shirt at left (C) wooden picture frame at center" }, { "from": "gpt", "value": "(A) framed paper at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6969194294fd7c00.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) green matte leaf at upper center (B) pink matte flower at upper right" }, { "from": "gpt", "value": "(A) green matte leaf at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8965668f3a0ed86.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of clear glass window at upper center in relation to black fur cat at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/970270592b086274.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the green leafy tree at center? Choose from: (A) matte black picnic table at lower left (B) dark gray wood bench at lower left (C) brown wooden pavilion at center (D) smooth gray bench at lower center" }, { "from": "gpt", "value": "(C) brown wooden pavilion at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c8f982fff136fa6f.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the white plastic bag at lower right? (A) white plastic bag at upper center (B) white matte tray at center" }, { "from": "gpt", "value": "(A) white plastic bag at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f93325ebe6be9ee.jpg", "conversations": [ { "from": "human", "value": "\nIs white plastic scale at center behind red digital display at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, white plastic scale at center is in front of red digital display at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e971eaa3ab8d608e.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the matte black hair at center? Choose from: (A) yellow fabric tank top at center (B) clear plastic bottle at lower right (C) matte black dress at center" }, { "from": "gpt", "value": "(B) clear plastic bottle at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/617e96b908f05baf.jpg", "conversations": [ { "from": "human", "value": "\nDoes printed fabric blouse at center lie in front of black shiny hair at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, printed fabric blouse at center is in front of black shiny hair at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3ab35fd3a021c859.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if camouflage fabric robe at center is smaller than blonde silky hair at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/afb34b796d726f97.jpg", "conversations": [ { "from": "human", "value": "\nIs orange patterned shirt at center to the right of floral fabric shirt at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, orange patterned shirt at center is to the right of floral fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/21bb570e3d05c0e1.jpg", "conversations": [ { "from": "human", "value": "\nDoes white floral apron at center have a larger size compared to breaded golden-brown hamburger at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, white floral apron at center is bigger than breaded golden-brown hamburger at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4725ee9458f12ca2.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) white fabric at center (B) smooth red tablecloth at center" }, { "from": "gpt", "value": "(A) white fabric at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4ee082067cba1033.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) dry grass at center (B) brown leather horse at center" }, { "from": "gpt", "value": "(A) dry grass at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16503892f34e3c24.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.119, 0.703) (B) (0.678, 0.453)" }, { "from": "gpt", "value": "(B) (0.678, 0.453)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05fef9aee695cf9a.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the orange printed swimsuit at center among (A) green leafy palm tree at upper center (B) transparent blue water at center?" }, { "from": "gpt", "value": "(A) green leafy palm tree at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/726d01554ba3b022.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of striped cotton shirt at center in relation to dark brown leather backpack at lower left? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0115a11822303c20.jpg", "conversations": [ { "from": "human", "value": "\nIs dark blue suit at left positioned before blue matte dress at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/51752820d6526004.jpg", "conversations": [ { "from": "human", "value": "\nDoes glassy steel skyscraper at center appear on the right side of gray glass skyscraper at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, glassy steel skyscraper at center is to the left of gray glass skyscraper at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dcdd7bb2c9eecce5.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of wooden bird feeder at center in reference to wooden mailbox at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/356bfd208b35d4b1.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.642, 0.722) (B) (0.429, 0.564) (C) (0.210, 0.714) (D) (0.502, 0.281)" }, { "from": "gpt", "value": "(B) (0.429, 0.564)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a8add1198c338b0.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue matte shirt at center lie behind shiny blue robot at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34dac64942120ed1.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.825, 0.450) (B) (0.201, 0.270) (C) (0.520, 0.750) (D) (0.577, 0.584)" }, { "from": "gpt", "value": "(B) (0.201, 0.270)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b3fa70b66d39c96.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.778, 0.578) (B) (0.529, 0.705)" }, { "from": "gpt", "value": "(A) (0.778, 0.578)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0a1292e4cd9f830.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of green leafy vegetable at center in reference to white matte rice at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60a2ff926a20303a.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) black wood picture frame at upper center (B) matte purple fabric lampshade at left (C) white textured bed at center" }, { "from": "gpt", "value": "(A) black wood picture frame at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8a8905b803b3954.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is wooden rocking chair at center located relative to pink striped shorts at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7c2988fbe703684.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) matte black suit at center (B) black polka dot scarf at upper left" }, { "from": "gpt", "value": "(A) matte black suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7f83bd6894a6587.jpg", "conversations": [ { "from": "human", "value": "\nIs metallic staircase at lower left thinner than metallic gray stairs at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, metallic staircase at lower left's width is not less than metallic gray stairs at lower left's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf4b56817c2e362a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark gray water at lower center is wider than green leafy tree at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, dark gray water at lower center is wider than green leafy tree at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4faaa22ba31af99.jpg", "conversations": [ { "from": "human", "value": "\nIs golden leafy tree at center wider than white glossy rail at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, the width of golden leafy tree at center exceeds that of white glossy rail at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f6be6bceaff08f54.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at left thinner than white plastic boat at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b86051b4c5a69a76.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the dark brown glass bottle at lower left? Choose from: (A) transparent glass at center (B) translucent glass wine at center (C) matte orange strapless dress at center (D) beige textured suit at center" }, { "from": "gpt", "value": "(B) translucent glass wine at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/28b55162c1c4fa17.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) green leafy tree at upper center (B) white stone rose window at center (C) green leafy tree at upper left (D) green leafy tree at left" }, { "from": "gpt", "value": "(A) green leafy tree at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f9625ff3770401b9.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) metallic silver surgical instruments at upper right (B) rubber glove at center (C) beige rubber glove at left" }, { "from": "gpt", "value": "(C) beige rubber glove at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/43832bbd96c12ccf.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) dark gray suit at left (B) dark gray hoodie at center (C) white matte projector screen at upper center" }, { "from": "gpt", "value": "(B) dark gray hoodie at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60a3a338c2f9c835.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) white smooth egret at right (B) dark blue water at lower left" }, { "from": "gpt", "value": "(A) white smooth egret at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/51490ea4079c9a05.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown rough tree at center is positioned to the right of green matte helmet at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, brown rough tree at center is to the right of green matte helmet at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49c7ffc6211a0264.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.896, 0.256) (B) (0.611, 0.719) (C) (0.479, 0.736) (D) (0.722, 0.684)" }, { "from": "gpt", "value": "(A) (0.896, 0.256)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8925a3c4bd435bda.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte glass bottle at center have a greater width compared to shiny silver bottle at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, matte glass bottle at center's width does not surpass shiny silver bottle at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7c28f5b9d1700126.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) shiny dark brown hair at center (B) curly black hair at upper right (C) curly blonde hair at lower right (D) gold shiny hair clip at upper right" }, { "from": "gpt", "value": "(C) curly blonde hair at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/321a6ab272c7f76b.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at upper center have a smaller size compared to white matte ferry at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, green leafy tree at upper center is not smaller in size than white matte ferry at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/39cd386c0133b960.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.393, 0.353) (B) (0.323, 0.467) (C) (0.929, 0.597) (D) (0.743, 0.341)" }, { "from": "gpt", "value": "(D) (0.743, 0.341)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f6db170cde99dbe.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.948, 0.309) (B) (0.601, 0.247) (C) (0.776, 0.166)" }, { "from": "gpt", "value": "(A) (0.948, 0.309)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4c7b482e8995b1a.jpg", "conversations": [ { "from": "human", "value": "\nIs cloudy sky at upper center to the right of white textured buildings at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, cloudy sky at upper center is to the right of white textured buildings at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/825f9e32d4ca2490.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) green water at lower left (B) light blue jeans at lower left (C) green leafy tree at center" }, { "from": "gpt", "value": "(A) green water at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/97b0182c6eb7f15b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if purple cotton blanket at center is smaller than white matte car at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, purple cotton blanket at center has a smaller size compared to white matte car at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a3ecf7fe0a332c19.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black jacket at upper left is positioned below matte black shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, matte black jacket at upper left is above matte black shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0665674c5c743657.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the blue printed blouse at center? (A) wooden table at left (B) wooden table at center (C) light brown wooden table at center" }, { "from": "gpt", "value": "(C) light brown wooden table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/474c5d74e58f1c51.jpg", "conversations": [ { "from": "human", "value": "\nDoes smooth gray shark at center have a larger size compared to silvery metallic fish at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/808d504a39c4135d.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green leafy tree at center located in relation to green leafy tree at lower right in the image? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/33cf31e0151778c3.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) gray matte skull at upper right (B) green striped sweater at center" }, { "from": "gpt", "value": "(A) gray matte skull at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e5794a60374ed787.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) shiny brown otter at center (B) shiny brown otter at left" }, { "from": "gpt", "value": "(A) shiny brown otter at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/520b31462c5a6e1e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black suit at center is smaller than black woolen coat at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, matte black suit at center occupies less space than black woolen coat at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/004c196c18277e76.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black matte jacket at center is positioned to the right of matte black phone at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, black matte jacket at center is to the left of matte black phone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b8efc7a695161a5.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the white smooth building at center? Choose among these: (A) white glossy building at center (B) concrete bridge at center" }, { "from": "gpt", "value": "(B) concrete bridge at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc045b9984aa3839.jpg", "conversations": [ { "from": "human", "value": "\nIs light gray fabric jacket at center positioned at the back of white cotton t-shirt at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is in front of white cotton t-shirt at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dba6a06627b36db7.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown feathered chicken at center have a lesser width compared to black feathered chicken at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/27248521e1fbf6dd.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) dark blue leather jacket at center (B) silver metallic shopping cart at lower right" }, { "from": "gpt", "value": "(B) silver metallic shopping cart at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/caf37e454ee27fb0.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if red backpack at right is wider than red matte backpack at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, the width of red backpack at right exceeds that of red matte backpack at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e1c1e25a52619eff.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) dark blue denim jeans at center (B) brown wooden bench at center" }, { "from": "gpt", "value": "(A) dark blue denim jeans at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/848852df52574d13.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the matte black shirt at center from the following options: (A) white matte shirt at center (B) gray cotton shirt at right (C) light brown hair at center?" }, { "from": "gpt", "value": "(C) light brown hair at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd6cc29e3dcc4b3f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.105, 0.438) (B) (0.522, 0.336) (C) (0.316, 0.625)" }, { "from": "gpt", "value": "(A) (0.105, 0.438)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d48d00acd82ef550.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte golf shirt at center below matte black golf bag at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, white matte golf shirt at center is below matte black golf bag at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e6a9d841e7f84a28.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.301, 0.645) (B) (0.788, 0.503)" }, { "from": "gpt", "value": "(A) (0.301, 0.645)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f60748d39a7a5af.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) striped cotton shirt at center (B) dark blue shirt at lower left (C) matte green backpack at center" }, { "from": "gpt", "value": "(C) matte green backpack at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b02be9764832be92.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.642, 0.309) (B) (0.392, 0.881)" }, { "from": "gpt", "value": "(A) (0.642, 0.309)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/738c267a7a579f4e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.722, 0.672) (B) (0.442, 0.289)" }, { "from": "gpt", "value": "(B) (0.442, 0.289)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2419137f9405a2e.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) green glossy leafy plant at center (B) wooden fish pond at center" }, { "from": "gpt", "value": "(B) wooden fish pond at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ae6fa719a5c7dbb1.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white matte board at center is positioned below blue fabric jacket at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/12ad9fe5068ed785.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte thatched hut at left have a smaller size compared to thatched straw hut at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, matte thatched hut at left is not smaller than thatched straw hut at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/93c63b4e190dd827.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.826, 0.572) (B) (0.202, 0.738)" }, { "from": "gpt", "value": "(A) (0.826, 0.572)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44bb14b51f9ebec2.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) green leafy plant at upper left (B) brown/scaly snake at center" }, { "from": "gpt", "value": "(A) green leafy plant at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db74e3d7eec2bea3.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) green leafy palm tree at upper left (B) brown thatch roof at center" }, { "from": "gpt", "value": "(B) brown thatch roof at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f6b12c2a1d00e07a.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.913, 0.556) (B) (0.325, 0.575) (C) (0.479, 0.523)" }, { "from": "gpt", "value": "(A) (0.913, 0.556)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/93fea898c102d1bf.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.463, 0.627) (B) (0.269, 0.766)" }, { "from": "gpt", "value": "(B) (0.269, 0.766)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/586e7c3447328935.jpg", "conversations": [ { "from": "human", "value": "\nDoes white frothy water at center have a greater width compared to brown leather jacket at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, white frothy water at center is wider than brown leather jacket at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7c531d99d194c89.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the white fabric table at lower right? Choose among these: (A) white fabric table at center (B) matte white shirt at center (C) orange printed shirt at center" }, { "from": "gpt", "value": "(C) orange printed shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/99176f4ceb4ce1e4.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if striped fabric person at center is thinner than smooth brown hair at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, striped fabric person at center is not thinner than smooth brown hair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e6a9095491f43337.jpg", "conversations": [ { "from": "human", "value": "\nIs whiteboard at upper center thinner than wooden table at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, whiteboard at upper center might be wider than wooden table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/704b12dc4cfea8c0.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.503, 0.367) (B) (0.016, 0.903)" }, { "from": "gpt", "value": "(A) (0.503, 0.367)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b43308088ff8caae.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the gray cotton t-shirt at center? Choose from: (A) matte red t-shirt at left (B) gray matte beard at center" }, { "from": "gpt", "value": "(B) gray matte beard at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/489eb99288d80fe3.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if denim shorts at center is bigger than metallic silver hammer at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, denim shorts at center is larger in size than metallic silver hammer at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dffb179595a71f2d.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) chocolatesmoothcake at center (B) blue matte shirt at center" }, { "from": "gpt", "value": "(A) chocolatesmoothcake at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e4881480f78a7ec8.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) green grass at lower center (B) yellow reflective vest at center (C) white wooden bench at upper right (D) green patina sculpture at center" }, { "from": "gpt", "value": "(A) green grass at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd6e5b75b854ab9c.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the matte gold dress at center? Choose from: (A) matte black dress at lower left (B) blue cotton polo shirt at center" }, { "from": "gpt", "value": "(A) matte black dress at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/054c00e637d42377.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.341, 0.931) (B) (0.980, 0.633)" }, { "from": "gpt", "value": "(A) (0.341, 0.931)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/26608e805c71e7ca.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if clear water at center is positioned above blue fabric bikini at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc983501b225166b.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) gray stone church at center (B) smooth stone tower at center" }, { "from": "gpt", "value": "(B) smooth stone tower at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88318368c8ddac40.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the black matte dress at center among (A) shiny red dress at center (B) gold sequined dress at center (C) white satin shirt at center?" }, { "from": "gpt", "value": "(C) white satin shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/80cbb582d35507e9.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if metallic green car at center is wider than white plastic license plate at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, metallic green car at center might be narrower than white plastic license plate at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/11e76c5951f6ff05.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) white smooth pillar at right (B) green painted wood sign at upper center (C) green painted wood door at center" }, { "from": "gpt", "value": "(A) white smooth pillar at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e092dd1d60368042.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the translucent glass wine at right? (A) matte green shirt at center (B) translucent glass wine at center" }, { "from": "gpt", "value": "(B) translucent glass wine at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d364effd4bc2b65.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte orange dress at center is positioned to the right of black wool suit at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find matte orange dress at center to the right of black wool suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/93da14cee7bdf51b.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.178, 0.703) (B) (0.849, 0.458)" }, { "from": "gpt", "value": "(B) (0.849, 0.458)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f0147a55ac7b7f30.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) green water at center (B) matte black dress at left (C) black fabric chair at center (D) teal printed dress at center" }, { "from": "gpt", "value": "(A) green water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58ab05e88ee209e7.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte blue shirt at center have a larger size compared to clear water at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, matte blue shirt at center might be smaller than clear water at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6efcabe387794aaa.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of matte gray dress at center in relation to gray leather dress at center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c556888e37cfa4e.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) green satin skirt at center (B) velvet brown coat at center (C) rainbow satin costume at center, is positioned farthest from the black wool coat at center?" }, { "from": "gpt", "value": "(C) rainbow satin costume at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16ba012275f8fb96.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the stone ruins at center? (A) light beige sweater at lower left (B) black plastic goggles at lower left" }, { "from": "gpt", "value": "(B) black plastic goggles at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a466b17b99b7bcc.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.088, 0.395) (B) (0.746, 0.570) (C) (0.263, 0.536)" }, { "from": "gpt", "value": "(A) (0.088, 0.395)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/24598f5802ec5d17.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.250, 0.636) (B) (0.581, 0.106)" }, { "from": "gpt", "value": "(B) (0.581, 0.106)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06c4bf3a3ad3ec3e.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.587, 0.378) (B) (0.480, 0.417)" }, { "from": "gpt", "value": "(B) (0.480, 0.417)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/472425db6ece4b3b.jpg", "conversations": [ { "from": "human", "value": "\nIs white t-shirt at left closer to camera compared to brown leather belt at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, white t-shirt at left is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e03ac8627ab016c0.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) metallic silver bicycle at center (B) green matte shorts at center" }, { "from": "gpt", "value": "(B) green matte shorts at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f376c39c93a67e6b.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden picture frame at center positioned in front of black silk tie at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b87bb4f018629582.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the brown sandy dirt track at center from the following options: (A) brown glossy horse at center (B) brown glossy horse at right?" }, { "from": "gpt", "value": "(A) brown glossy horse at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f8edf074fdcf7348.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray matte mud at left have a smaller size compared to matte gray mud at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d42e1eb474ec4b6c.jpg", "conversations": [ { "from": "human", "value": "\nIs orange plastic canoe at center smaller than wooden paddle at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, orange plastic canoe at center has a smaller size compared to wooden paddle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e44f008c67d81af.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.000, 0.988) (B) (0.029, 0.464) (C) (0.965, 0.950)" }, { "from": "gpt", "value": "(C) (0.965, 0.950)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/032f01960ad7eda1.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.070, 0.463) (B) (0.523, 0.759) (C) (0.794, 0.362)" }, { "from": "gpt", "value": "(A) (0.070, 0.463)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bcb2df5e2f193e10.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth skin hand at upper left bigger than chocolate matte ice cream at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, smooth skin hand at upper left has a larger size compared to chocolate matte ice cream at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b9f67484633d6b5.jpg", "conversations": [ { "from": "human", "value": "\nWhere is maroon sweater at left located in relation to black matte shirt at center in the image? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bae591537d128745.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black jacket at left closer to camera compared to striped fabric face at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is in front of striped fabric face at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e08bd97aa4c5015.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the wooden table at upper center? Choose among these: (A) dark gray hoodie at center (B) wooden table at center" }, { "from": "gpt", "value": "(A) dark gray hoodie at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/51c42433fbc8ffa3.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black phone at center appear over light brown suede jacket at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, matte black phone at center is positioned over light brown suede jacket at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5cd141930af353d5.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) brown leather jacket at lower center (B) white glossy pillar at center" }, { "from": "gpt", "value": "(B) white glossy pillar at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe08ce283ed9fe00.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.377, 0.547) (B) (0.535, 0.619) (C) (0.932, 0.531) (D) (0.050, 0.653)" }, { "from": "gpt", "value": "(C) (0.932, 0.531)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0999dc2b518136a8.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.413, 0.431) (B) (0.021, 0.798) (C) (0.857, 0.445) (D) (0.270, 0.203)" }, { "from": "gpt", "value": "(B) (0.021, 0.798)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c1c571eed0bb643.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) gray hoodie at center (B) wooden table at center" }, { "from": "gpt", "value": "(B) wooden table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5688660228c5446.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is gray textured blazer at center located relative to dark gray suit at center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8bfc28b64cc2b995.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy trees at center lie behind green leafy palm at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, green leafy trees at center is behind green leafy palm at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f4350ec926fc301.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) light brown wooden post at center (B) neon green shorts at left" }, { "from": "gpt", "value": "(B) neon green shorts at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4548b7580e3c2a5e.jpg", "conversations": [ { "from": "human", "value": "\nDoes green pine tree at center have a lesser width compared to greenish reflective water at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, green pine tree at center is not thinner than greenish reflective water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/103a938844b403bd.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.760, 0.986) (B) (0.987, 0.698) (C) (0.188, 0.830)" }, { "from": "gpt", "value": "(A) (0.760, 0.986)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34ec86ac892ff29c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.678, 0.650) (B) (0.374, 0.375)" }, { "from": "gpt", "value": "(B) (0.374, 0.375)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58c95a0de2cc14fb.jpg", "conversations": [ { "from": "human", "value": "\nDoes pink fabric hair at lower center appear on the right side of brown hair at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find pink fabric hair at lower center to the right of brown hair at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/785353639563fb55.jpg", "conversations": [ { "from": "human", "value": "\nIs teal fabric canopy at upper center to the left of teal painted wood pole at right from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find teal fabric canopy at upper center to the left of teal painted wood pole at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b4e282ad1e8539b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white fabric flag at center is positioned above shiny plastic beads at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, white fabric flag at center is positioned over shiny plastic beads at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/adc32596f2bd43a9.jpg", "conversations": [ { "from": "human", "value": "\nDoes beige stone building at center lie in front of white glossy building at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a37f2723b15806dc.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) white matte shirt at left (B) white glossy airplane at right" }, { "from": "gpt", "value": "(B) white glossy airplane at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a198edf0d892a177.jpg", "conversations": [ { "from": "human", "value": "\nIs light blue fabric at center smaller than dark blue fabric at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, light blue fabric at center is not smaller than dark blue fabric at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/38e1160f9d542a19.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black blazer at center have a lesser width compared to black silk suit at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, matte black blazer at center is not thinner than black silk suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70a3a559a50fe0ba.jpg", "conversations": [ { "from": "human", "value": "\nIs white glossy plate at center further to camera compared to shiny metallic spoon at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is in front of shiny metallic spoon at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/920e0af0601be72d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if tan rubber slide at left is positioned to the left of matte green shirt at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, tan rubber slide at left is not to the left of matte green shirt at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/069ce9f6a3386bc8.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.817, 0.695) (B) (0.430, 0.247) (C) (0.339, 0.630)" }, { "from": "gpt", "value": "(C) (0.339, 0.630)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d76ede9196421ad1.jpg", "conversations": [ { "from": "human", "value": "\nIs white cotton crowd at upper center to the right of black uniform at lower left from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find white cotton crowd at upper center to the right of black uniform at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/675d4113c1f36721.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if multicolored mosaic door at center is bigger than pink matte heart at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cae45fb105026782.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown leafless tree at center is thinner than green leafy tree at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b69fad1ce7f14c75.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) gray concrete pavement at center (B) dark brown bark at right" }, { "from": "gpt", "value": "(A) gray concrete pavement at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a6bc0a0004e9ff5.jpg", "conversations": [ { "from": "human", "value": "\nIs brown glossy horse at center thinner than orange jersey at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, brown glossy horse at center might be wider than orange jersey at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ead864af1c877051.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the green leafy tree at upper center? Choose from: (A) dark brown stone gravestone at lower left (B) green leafy palm tree at center" }, { "from": "gpt", "value": "(A) dark brown stone gravestone at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/deb5b755670cd89d.jpg", "conversations": [ { "from": "human", "value": "\nDoes fluffy yellow chick at center have a greater width compared to soft yellow chick at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd9b5bd60563d9f7.jpg", "conversations": [ { "from": "human", "value": "\nIs brown speckled pigeon at center thinner than brown speckled sparrow at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/483686d909fafcb6.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the dark gray elephant at center from the following options: (A) dark asphalt road at center (B) green leafy palm tree at center (C) black matte cow at center?" }, { "from": "gpt", "value": "(B) green leafy palm tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd250cc660ad4c34.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.517, 0.317) (B) (0.940, 0.373) (C) (0.592, 0.380)" }, { "from": "gpt", "value": "(A) (0.517, 0.317)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/416254c982a4606c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.501, 0.384) (B) (0.749, 0.959) (C) (0.049, 0.477)" }, { "from": "gpt", "value": "(B) (0.749, 0.959)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b32e7d7c91ae1217.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) green water at lower center (B) blue fabric shorts at right" }, { "from": "gpt", "value": "(A) green water at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c7d1ef97f06029a.jpg", "conversations": [ { "from": "human", "value": "\nIs matte brown pants at left to the right of matte brown jacket at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, matte brown pants at left is to the left of matte brown jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/131b869d35392ab7.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) green grass at lower center (B) green concrete pipes at lower center (C) yellow rubber tractor at left" }, { "from": "gpt", "value": "(A) green grass at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df1bba8bb35a85ab.jpg", "conversations": [ { "from": "human", "value": "\nIs green matte trees at center wider than dark green textured tree at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, the width of green matte trees at center exceeds that of dark green textured tree at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e4837c82d24c2b85.jpg", "conversations": [ { "from": "human", "value": "\nDoes black fabric shirt at lower left appear on the left side of white paper at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find black fabric shirt at lower left to the left of white paper at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c55117172f883408.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) red matte shirt at center (B) gray cotton t-shirt at right (C) grilled sausage at center (D) matte red grill at center" }, { "from": "gpt", "value": "(D) matte red grill at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/81aa1088681a3a44.jpg", "conversations": [ { "from": "human", "value": "\nIs white glossy surfboard at center above black matte wetsuit at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, white glossy surfboard at center is not above black matte wetsuit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d77c0b0c6d141c5.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the metallic silver water tower at center right? Select from: (A) green leafy tree at left (B) metallic column at center (C) green leafy tree at right" }, { "from": "gpt", "value": "(B) metallic column at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/99fec804dff790e5.jpg", "conversations": [ { "from": "human", "value": "\nDoes wooden bench at center have a smaller size compared to black leather jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, wooden bench at center is not smaller than black leather jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4e8f3aacb42a9c3.jpg", "conversations": [ { "from": "human", "value": "\nIs brown feathered bald eagle at center positioned behind brown rough tree branch at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, brown feathered bald eagle at center is further from the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d7248c756119859.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if cloudy sky at upper center is positioned above green grass at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/278d150a1bf712b0.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is gray cotton jacket at center located relative to striped cotton shirt at lower left? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9a86ec4b56f58f72.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black bookshelf at upper center appear under cardboard box at center-right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, matte black bookshelf at upper center is above cardboard box at center-right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3f42b89731688d50.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) green grassy pond at center (B) green textured trees at upper right" }, { "from": "gpt", "value": "(B) green textured trees at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba2065bdd4325633.jpg", "conversations": [ { "from": "human", "value": "\nDoes white smooth shirt at center have a larger size compared to white floral petals at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, white smooth shirt at center has a larger size compared to white floral petals at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a9fd825e6500ab21.jpg", "conversations": [ { "from": "human", "value": "\nIs gray patterned shirt at center bigger than patterned fabric arm at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, gray patterned shirt at center is bigger than patterned fabric arm at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/45cedf7fcafc0c51.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.162, 0.469) (B) (0.184, 0.745) (C) (0.595, 0.759)" }, { "from": "gpt", "value": "(A) (0.162, 0.469)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3568b9f5b651b774.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of dark brown hair at upper right and camouflage-patterned snake at center in the image provided, where is dark brown hair at upper right located with respect to camouflage-patterned snake at center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3500dfb99ccef1cd.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green puffy jacket at lower right is positioned to the right of white knit hat at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green puffy jacket at lower right is positioned on the right side of white knit hat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44cfb76d5effd5d7.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.931, 0.183) (B) (0.401, 0.411)" }, { "from": "gpt", "value": "(B) (0.401, 0.411)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d8d3426af2cfb186.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) black silk tie at right (B) matte black suit at left" }, { "from": "gpt", "value": "(A) black silk tie at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a6224291982cb526.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of black pinstripe suit at center less distant than that of blonde curly hair at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, black pinstripe suit at center is behind blonde curly hair at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be88cb8f4569f3b4.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.632, 0.475) (B) (0.624, 0.239)" }, { "from": "gpt", "value": "(B) (0.624, 0.239)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8f5ce538c4f87361.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass at center above brown stone church at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, green grass at center is below brown stone church at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d5b9feb9f5192568.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the black satin kimono at center? Choose from: (A) red satin sandal at center (B) shiny red sandal at center" }, { "from": "gpt", "value": "(B) shiny red sandal at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23a6c7414acef732.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) gray gravelly sand at center (B) blue water at center" }, { "from": "gpt", "value": "(A) gray gravelly sand at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d58af682a075f27.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white stone church at center is smaller than metallic silver car at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9407f2231a7aad58.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.784, 0.252) (B) (0.151, 0.984) (C) (0.406, 0.311)" }, { "from": "gpt", "value": "(B) (0.151, 0.984)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5f092302e00e23e6.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of green matte/glossy bass guitar at left in relation to matte white monitor at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c17c0abada9b08bd.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) green rubber curb at lower center (B) green matte license plate at lower right" }, { "from": "gpt", "value": "(A) green rubber curb at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e0a8c0e4f69a29f.jpg", "conversations": [ { "from": "human", "value": "\nIs white cotton shirt at center above white matte forehead at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60469448d2e21dc6.jpg", "conversations": [ { "from": "human", "value": "\nIs black velvet curtain at left to the right of matte gray sweater at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, black velvet curtain at left is not to the right of matte gray sweater at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc8b0cf13c728388.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.899, 0.427) (B) (0.444, 0.489)" }, { "from": "gpt", "value": "(B) (0.444, 0.489)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/45f86ad20755b01b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brick theater at center is thinner than blue fabric backpack at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, brick theater at center's width is not less than blue fabric backpack at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/13368ea548e1c745.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) silhouette fishing rod at left (B) clear water at railing left (C) black fabric cap at upper right (D) dark blue jeans at center" }, { "from": "gpt", "value": "(B) clear water at railing left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/400c82a6afd5a6d8.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the yellow-green leafy tree at upper center from the following options: (A) green matte evergreen tree at upper center (B) clear water at center (C) green matte tree at upper center (D) orange autumn leaves at left?" }, { "from": "gpt", "value": "(D) orange autumn leaves at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d9bcd9c48ec69c7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark green sweater at center is smaller than brown cardboard box at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, dark green sweater at center might be larger than brown cardboard box at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a7c50aa91395e27.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) yellow matte toy car at center (B) gray plastic baby carriage at upper center" }, { "from": "gpt", "value": "(B) gray plastic baby carriage at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cafdb1e025e0efa6.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow matte van at lower right positioned at the back of shiny black car at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, yellow matte van at lower right is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bb13255b2a01ea9c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.601, 0.330) (B) (0.682, 0.919) (C) (0.616, 0.239)" }, { "from": "gpt", "value": "(B) (0.682, 0.919)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/52663bf3eb9fd578.jpg", "conversations": [ { "from": "human", "value": "\nDoes natural bamboo wind chime at center appear under white driftwood branch at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, natural bamboo wind chime at center is located below white driftwood branch at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/972693fbf213ceb5.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the dark suit at center? Select from: (A) dark pinstripe suit at center (B) matte black suit at center (C) gray textured blazer at center" }, { "from": "gpt", "value": "(B) matte black suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07367b6b69a006c0.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) matte leather shoe at lower left (B) brown leather shoe at lower right" }, { "from": "gpt", "value": "(B) brown leather shoe at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b534204e8e2e6dd.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of plaid fabric shirt at left in reference to pink matte hand at upper center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ac4b6af6f0c47031.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the golden crispy chicken at lower left? Choose among these: (A) crumbly golden bread at center (B) striped cotton shirt at center" }, { "from": "gpt", "value": "(B) striped cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9e639613024d13d1.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) green leafy tree at upper right (B) green reflective water at center" }, { "from": "gpt", "value": "(A) green leafy tree at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02e6eac200a8c298.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white glossy shirt at center is wider than white shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white glossy shirt at center is not wider than white shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/91cf5ba41915e57d.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of white satin blouse at center and orange fleece jacket at right in the image provided, where is white satin blouse at center located with respect to orange fleece jacket at right? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/edc44b2375642e1b.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the matte coral dress at center among (A) asphalt road at center (B) blue plaid umbrella at center (C) pale pink fabric dress at center?" }, { "from": "gpt", "value": "(C) pale pink fabric dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f919f5560a230115.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.684, 0.566) (B) (0.466, 0.569) (C) (0.625, 0.534) (D) (0.523, 0.667)" }, { "from": "gpt", "value": "(D) (0.523, 0.667)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5ad7f19abb23c81b.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is green leafy tree at center located relative to matte black bust at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4ff2306c06e554a3.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of black satin abaya at center less distant than that of black metallic car at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/27d75adfef426b49.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.113, 0.312) (B) (0.969, 0.605)" }, { "from": "gpt", "value": "(B) (0.969, 0.605)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/15ce8034935e3845.jpg", "conversations": [ { "from": "human", "value": "\nIs matte gray suit at center positioned behind matte gray jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c854a8667008d8e9.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.944, 0.308) (B) (0.438, 0.395)" }, { "from": "gpt", "value": "(A) (0.944, 0.308)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b90cb7fe79dae1fa.jpg", "conversations": [ { "from": "human", "value": "\nIs blue fabric apron at right further to camera compared to matte purple shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is in front of matte purple shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/048016b953099bf4.jpg", "conversations": [ { "from": "human", "value": "\nIs white cotton shirt at lower right below light orange t-shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3797cc12e454859e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) matte black sign at center (B) matte red sign at center (C) white plastic tricycle at center" }, { "from": "gpt", "value": "(A) matte black sign at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7f684ecf3722ac15.jpg", "conversations": [ { "from": "human", "value": "\nIs brown mud at lower right to the right of brown wooden hut at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, brown mud at lower right is positioned on the right side of brown wooden hut at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2b7a37dc10c174c.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue t-shirt at right appear on the right side of dark blue shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, blue t-shirt at right is to the right of dark blue shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a302920028a609d.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray fabric shirt at center appear under woodenmaterial/texturetable at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, gray fabric shirt at center is not below woodenmaterial/texturetable at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a3c7a7d56275979c.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth orange wooden torii gate at center smaller than white stone pillar at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, smooth orange wooden torii gate at center has a smaller size compared to white stone pillar at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9d873c0ce4d3f57d.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden table at lower center positioned behind matte black jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, wooden table at lower center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a2244b500729e7c.jpg", "conversations": [ { "from": "human", "value": "\nIs green textured trees at left closer to the viewer compared to green leafy tree at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, green textured trees at left is in front of green leafy tree at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/025899d2103bf10a.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.401, 0.764) (B) (0.336, 0.686) (C) (0.360, 0.986) (D) (0.756, 0.639)" }, { "from": "gpt", "value": "(C) (0.360, 0.986)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c6341c25e98bbbde.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.599, 0.503) (B) (0.448, 0.133) (C) (0.747, 0.312)" }, { "from": "gpt", "value": "(C) (0.747, 0.312)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e1eb22f1c68e42a3.jpg", "conversations": [ { "from": "human", "value": "\nIs orange tabby cat at upper right to the left of tabby fur at left from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, orange tabby cat at upper right is not on the left side of tabby fur at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/459fda4131e88048.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray pinstripe suit at center come behind satin silver pole at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b9851b643a760a5.jpg", "conversations": [ { "from": "human", "value": "\nDoes black matte duck at center have a larger size compared to brown matte duckling at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, black matte duck at center is bigger than brown matte duckling at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba2fc6d5bca20c91.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) black matte sculpture at center (B) green matte shirt at center" }, { "from": "gpt", "value": "(B) green matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/42172c6426db09b8.jpg", "conversations": [ { "from": "human", "value": "\nIs green metal fence at center smaller than yellow matte fire hydrant at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, green metal fence at center is not smaller than yellow matte fire hydrant at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b91a575573e0ca6f.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) black matte microphone at center (B) matte black microphone at center (C) purple glossy computer monitor at lower right (D) skinny white hand at upper center" }, { "from": "gpt", "value": "(C) purple glossy computer monitor at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8428012d8ed77703.jpg", "conversations": [ { "from": "human", "value": "\nIs black leather jacket at left positioned behind leather jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, black leather jacket at left is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/612c337b21648e55.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue plastic quad bike at center is positioned below gray fabric shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, blue plastic quad bike at center is above gray fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4b20cdb1eb0603cf.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) black plastic sunglasses at upper center (B) black leather jacket at left (C) black matte sunglasses at center" }, { "from": "gpt", "value": "(A) black plastic sunglasses at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/89a6e6bcfd45262e.jpg", "conversations": [ { "from": "human", "value": "\nWhere is white translucent potatoes at lower left located in relation to white matte dumplings at center in the image? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8670ff5379612931.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at left below dark gray fabric person at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, green leafy tree at left is not below dark gray fabric person at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a9c7718717b2b10b.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.222, 0.223) (B) (0.066, 0.423)" }, { "from": "gpt", "value": "(A) (0.222, 0.223)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d3bea6ba76131281.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of metallic silver table at center less distant than that of metallic silver chair at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/59b7bda4aa48d388.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) black wool coat at center (B) brown leather jacket at center (C) black matte suit at center" }, { "from": "gpt", "value": "(C) black matte suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2232535cc17b816d.jpg", "conversations": [ { "from": "human", "value": "\nIs reflective black water at center wider than light gray shirt at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, reflective black water at center has a greater width compared to light gray shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00b002a84d61d536.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the black fur dog at center? Select from: (A) clear plastic water bottle at center (B) matte black nose at upper left (C) yellow striped polo shirt at center" }, { "from": "gpt", "value": "(C) yellow striped polo shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca8ad1fa130c8e93.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) gray bark tree at right (B) green leafy tree at left" }, { "from": "gpt", "value": "(B) green leafy tree at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1eaf71908de2156.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if transparent glass water at center is wider than white snow-covered mountain at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, transparent glass water at center's width does not surpass white snow-covered mountain at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ade56ec06e657a83.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.447, 0.694) (B) (0.298, 0.725) (C) (0.508, 0.753) (D) (0.519, 0.659)" }, { "from": "gpt", "value": "(C) (0.508, 0.753)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f904abfd113ef7cc.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte red sedan at lower right appear on the right side of metallic blue sedan at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, matte red sedan at lower right is not to the right of metallic blue sedan at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9d71bdecbd76c57.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the white glossy bird at center from the following options: (A) white glossy bird at upper center (B) white glossy bird at upper left?" }, { "from": "gpt", "value": "(A) white glossy bird at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5da8d4522ab05160.jpg", "conversations": [ { "from": "human", "value": "\nIs green fabric awning at center closer to camera compared to teal fabric signboard at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/45d81ec661365900.jpg", "conversations": [ { "from": "human", "value": "\nWhere is dark gray rough bark at center located in relation to smooth bark tree trunk at center in the image? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f077af02b420e0da.jpg", "conversations": [ { "from": "human", "value": "\nIs blue metallic crane at center wider than blue metallic crane at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, blue metallic crane at center is not wider than blue metallic crane at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d58a510a759eda7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray rocky mountains at upper center is smaller than green succulent at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, gray rocky mountains at upper center is not smaller than green succulent at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fa45f91737a59151.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) dry grass at center (B) brown dry bush at center (C) brown dry wood at center" }, { "from": "gpt", "value": "(A) dry grass at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fafe392c47aeed6a.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) brick textured archway at center (B) teal matte jacket at center (C) teal fabric jacket at center" }, { "from": "gpt", "value": "(A) brick textured archway at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8aa87cac1d90c7b2.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.419, 0.272) (B) (0.236, 0.684) (C) (0.799, 0.736)" }, { "from": "gpt", "value": "(B) (0.236, 0.684)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/310846d1199cda95.jpg", "conversations": [ { "from": "human", "value": "\nIs dark green matte suv at center positioned in front of dark green tank top at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7c1cbb9a8a182bfc.jpg", "conversations": [ { "from": "human", "value": "\nIs gray fabric hat at center to the right of green matte bowl at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, gray fabric hat at center is not on the right side of green matte bowl at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7d154636e4126b4e.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.221, 0.792) (B) (0.899, 0.478)" }, { "from": "gpt", "value": "(B) (0.899, 0.478)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60b9808d3d5f0430.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of clear water at center in relation to spotted fur giraffe at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b481345e2262408d.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte tank top at center have a greater width compared to camouflage fabric suitcase at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e3bbd111139374c.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray smooth hospital bed at center appear under smooth skin baby at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, gray smooth hospital bed at center is not positioned below smooth skin baby at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2885a9d751a9d4c6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white cotton shirt at center is positioned above dark gray fabric backpack at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, white cotton shirt at center is above dark gray fabric backpack at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/74c1f05f07eea827.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if polished chrome mirror at center is thinner than metallic silver clock at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, polished chrome mirror at center is not thinner than metallic silver clock at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3f8b7a149894ba9c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if red cloth table at lower center is positioned to the left of white shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, red cloth table at lower center is to the right of white shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88d9c7da6b7d7e3a.jpg", "conversations": [ { "from": "human", "value": "\nDoes white brick building at center appear on the left side of brown brick sign at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, white brick building at center is not on the left side of brown brick sign at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16c0aec17c10b7ae.jpg", "conversations": [ { "from": "human", "value": "\nIs silhouette figure at upper right positioned before silhouette jacket at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a8efcc775a54721.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of matte glass building at center and white textured building at right in the image provided, where is matte glass building at center located with respect to white textured building at right? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/591fb3bc773adfb8.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.847, 0.741) (B) (0.693, 0.605) (C) (0.758, 0.467)" }, { "from": "gpt", "value": "(C) (0.758, 0.467)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0bf50bcf122104da.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the matte red car at center? (A) blue fabric shirt at right (B) shiny red car at center" }, { "from": "gpt", "value": "(B) shiny red car at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ac42074f753a8818.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.547, 0.350) (B) (0.502, 0.902) (C) (0.404, 0.695)" }, { "from": "gpt", "value": "(B) (0.502, 0.902)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d5919970356481fa.jpg", "conversations": [ { "from": "human", "value": "\nIs black smooth shirt at center smaller than matte blue fabric can cooler at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c3660dd9149ebe4d.jpg", "conversations": [ { "from": "human", "value": "\nIs white soft baby at center below blue plastic pacifier at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, white soft baby at center is above blue plastic pacifier at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0ad226fa19b745a.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown rough log at lower center come behind brown rough log at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is in front of brown rough log at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3056603b89415ae7.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the black satin dress at center? Choose among these: (A) matte black dress at center (B) white ceramic bowl at lower left (C) blue checkered tablecloth at lower right" }, { "from": "gpt", "value": "(A) matte black dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ab1dcac6afe0fb5.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.498, 0.834) (B) (0.838, 0.525)" }, { "from": "gpt", "value": "(A) (0.498, 0.834)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5971cf9e15db1c8f.jpg", "conversations": [ { "from": "human", "value": "\nDoes green uniform at center have a lesser width compared to matte green uniform at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, green uniform at center might be wider than matte green uniform at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cea5c748eb41aceb.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.897, 0.713) (B) (0.576, 0.658) (C) (0.110, 0.655)" }, { "from": "gpt", "value": "(A) (0.897, 0.713)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/336d2ead4548b15c.jpg", "conversations": [ { "from": "human", "value": "\nIs white lace dress at upper center behind clear glass wine glass at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white lace dress at upper center is in front of clear glass wine glass at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/99302dcd618e8aa8.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) dark gray metallic car at left (B) sleek black sedan at center, is positioned closest to the transparent glass window at upper right?" }, { "from": "gpt", "value": "(B) sleek black sedan at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df6e7747d877711e.jpg", "conversations": [ { "from": "human", "value": "\nDoes light beige leather jacket at center have a greater width compared to brown suede boot at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, the width of light beige leather jacket at center exceeds that of brown suede boot at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5dd228f6c21dac6c.jpg", "conversations": [ { "from": "human", "value": "\nIs pink matte onesie at center below blonde hair at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/99e1189fb9150f80.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.095, 0.545) (B) (0.442, 0.691)" }, { "from": "gpt", "value": "(A) (0.095, 0.545)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e612f6909373df7c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) hardcover book at center (B) red matte hardcover book at center" }, { "from": "gpt", "value": "(A) hardcover book at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cae75863acecddea.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the white fleece jacket at lower right among (A) white fabric baby carriage at lower left (B) wooden bench at center?" }, { "from": "gpt", "value": "(A) white fabric baby carriage at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a3c8a057f4ea9e94.jpg", "conversations": [ { "from": "human", "value": "\nDoes white fluffy cloud at upper center appear under green needle-like at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b88fcd5d8ddb9c42.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the white matte vest at center? (A) matte black sweater at left (B) matte black vest at center (C) red argyle vest at center (D) orange argyle sweater vest at right" }, { "from": "gpt", "value": "(D) orange argyle sweater vest at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/965d4f17e0f2b88d.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) orange matte shirt at lower left (B) black matte construction worker at center" }, { "from": "gpt", "value": "(A) orange matte shirt at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d7f227241057466.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the clear stone stream at center? (A) green leafy tree at center (B) green leafy tree at upper center (C) green leafy tree at upper left" }, { "from": "gpt", "value": "(B) green leafy tree at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a909ca4a9edb600b.jpg", "conversations": [ { "from": "human", "value": "\nIs blue shirt at lower right behind matte white shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8ac724174065e2ac.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy palm tree at upper right above shiny black suv at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/17899d73a7433151.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the black matte uniform at left? Select from: (A) black matte jacket at lower right (B) black matte uniform at center" }, { "from": "gpt", "value": "(A) black matte jacket at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5a3b9e638ccbdfe.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white matte antlers at center is wider than matte red sign at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, the width of white matte antlers at center exceeds that of matte red sign at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1552324558926c5.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if smooth glossy buoy at center is positioned below white plastic boat at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, smooth glossy buoy at center is located below white plastic boat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/47f07c651bf1871f.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if glossy metallic train at center is bigger than white glossy train at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, glossy metallic train at center is bigger than white glossy train at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/856a5b40bea4a6d5.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is white fluffy cloud at upper center located relative to yellow matte building at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e6c2f5693e61412b.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray fabric jacket at center have a greater width compared to orange fleece jacket at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, gray fabric jacket at center is wider than orange fleece jacket at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a7708eb4bfd68c8.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) white plastic sewing machine at right (B) pink fleece sweater at upper left (C) matte plastic lamp at upper center" }, { "from": "gpt", "value": "(B) pink fleece sweater at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2bb0cb790fa78b65.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny brown horse at center wider than matte black suit at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, shiny brown horse at center has a greater width compared to matte black suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7fe6f1da771d257.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark brown hair at upper right is positioned to the left of pink matte shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, dark brown hair at upper right is not to the left of pink matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1f8f8d5ddeff6ec.jpg", "conversations": [ { "from": "human", "value": "\nDoes clear water at center appear on the left side of white glossy sailboat at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, clear water at center is not on the left side of white glossy sailboat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78b17daa0ac3df66.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.044, 0.175) (B) (0.392, 0.195) (C) (0.315, 0.773)" }, { "from": "gpt", "value": "(C) (0.315, 0.773)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8c42d06d253054f.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) green leafy bush at center (B) bronze statue at center" }, { "from": "gpt", "value": "(A) green leafy bush at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00761f844a396417.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at upper center is thinner than matte gray backpack at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, green leafy tree at upper center might be wider than matte gray backpack at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/abd5151cae53a325.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green checkered shirt at upper left is positioned above pink polka dot fleece at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, green checkered shirt at upper left is located above pink polka dot fleece at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bed25bcffc1e6a45.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the porcelain plate at upper right? (A) shiny blue cake at center (B) white paper plate at upper right (C) shiny dark chocolate cake at center (D) floral paper plate at upper right" }, { "from": "gpt", "value": "(A) shiny blue cake at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8fefa18fba72846a.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth bark tree at center bigger than smooth sand at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, smooth bark tree at center is larger in size than smooth sand at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d33ce4ff72d3a29d.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the metallic silver microphone at center? Select from: (A) black metallic microphone at lower center (B) matte black suit at center (C) dark gray suit at center (D) purple matte shirt at center" }, { "from": "gpt", "value": "(C) dark gray suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/824e6266cb4c78e8.jpg", "conversations": [ { "from": "human", "value": "\nIs matte red jacket at center above red plastic cup at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte red jacket at center is above red plastic cup at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0c538c77f2b99b5.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if denim shorts at center is positioned below blue denim shorts at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, denim shorts at center is above blue denim shorts at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9e52f42152f5efd1.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if striped shirt at center is smaller than red fabric banner at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d02bdd845577d63c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) green leafy hedge at center (B) green leafy hedge at lower center (C) green leafy tree at left" }, { "from": "gpt", "value": "(A) green leafy hedge at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/399e701f0fc947f2.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) white matte shirt at lower right (B) black matte shirt at right" }, { "from": "gpt", "value": "(A) white matte shirt at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d9a10e005b9f0d4.jpg", "conversations": [ { "from": "human", "value": "\nIs matte brown pants at center thinner than matte brown jumpsuit at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, matte brown pants at center's width is not less than matte brown jumpsuit at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70b8fec6a649f0b1.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown leather hammer at center come behind matte green figure at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, brown leather hammer at center is behind matte green figure at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5e85e1fe2e776d7.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) black mesh swivel chair at center (B) metallic silver desk lamp at upper center (C) silver metallic laptop at center" }, { "from": "gpt", "value": "(A) black mesh swivel chair at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/38d27327f378db2e.jpg", "conversations": [ { "from": "human", "value": "\nIs zebra print bikini top at center wider than black matte bikini at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, zebra print bikini top at center is wider than black matte bikini at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a1187fb148376ec.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black microphone at center smaller than light brown leather jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, matte black microphone at center is not smaller in size than light brown leather jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00baf4acd29fec99.jpg", "conversations": [ { "from": "human", "value": "\nIs white glossy boat at right to the left of wooden at right from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white glossy boat at right is not on the left side of wooden at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/67f8fab0de68b80a.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray suede jacket at left appear on the right side of white glossy laptop at right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, gray suede jacket at left is not to the right of white glossy laptop at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0c9d8148e01153c2.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) green fabric dress at center (B) green plastic wheelbarrow at center" }, { "from": "gpt", "value": "(B) green plastic wheelbarrow at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d45e07e45f8496b3.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of dark gray crowd at lower center in reference to black matte shirt at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6af450850d1ffa44.jpg", "conversations": [ { "from": "human", "value": "\nIs matte purple flower at center to the right of plush toy at lower left from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, matte purple flower at center is not on the right side of plush toy at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8accb6906ae49fd0.jpg", "conversations": [ { "from": "human", "value": "\nIs blue fleece jacket at center positioned behind matte red jacket at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/978bb3c2d20790ef.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) white fleece jacket at center (B) denim jacket at center" }, { "from": "gpt", "value": "(B) denim jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cfae9310292fd1c5.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.535, 0.869) (B) (0.060, 0.622)" }, { "from": "gpt", "value": "(B) (0.060, 0.622)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/47408558151b9519.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy island at center have a lesser width compared to white matte wing at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e763076e64556d3c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.739, 0.388) (B) (0.460, 0.384) (C) (0.955, 0.580)" }, { "from": "gpt", "value": "(B) (0.460, 0.384)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6adae7e0bfd435c5.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the blue cotton t-shirt at upper center? Choose among these: (A) blue cotton t-shirt at center (B) white fabric baseball cap at upper left" }, { "from": "gpt", "value": "(B) white fabric baseball cap at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9308d29a09d2d17.jpg", "conversations": [ { "from": "human", "value": "\nIs olive green uniform at center wider than silver metallic laptop at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, olive green uniform at center is wider than silver metallic laptop at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1eccb346160be1f1.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) dark brown corduroy overalls at center (B) black leather jacket at left (C) brown corduroy overalls at center" }, { "from": "gpt", "value": "(B) black leather jacket at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/166659e180fa4e44.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) brushed metal cart at center (B) white fabric street vendor at center (C) black chalkboard at center" }, { "from": "gpt", "value": "(A) brushed metal cart at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a275f7f68409126.jpg", "conversations": [ { "from": "human", "value": "\nDoes black and white fur at center appear under white fluffy dog at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c409822a4168c5be.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte shirt at center below silver metallic pendant at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be0bde66371d9729.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) metallic lattice tower at center (B) blue water at lower center" }, { "from": "gpt", "value": "(B) blue water at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/79ac7b296d54afc0.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) purple fabric at left (B) purple matte sweater at left (C) teal sequined beanie at upper right" }, { "from": "gpt", "value": "(B) purple matte sweater at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a77c680e334645b4.jpg", "conversations": [ { "from": "human", "value": "\nIs green grassy at center positioned behind smooth skin man at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, green grassy at center is in front of smooth skin man at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06143883a84d69e7.jpg", "conversations": [ { "from": "human", "value": "\nDoes bare wood tree at upper center come behind bare wood tree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is in front of bare wood tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7f2d9ccda375ec6.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) matte gold glass at right (B) gold textured glass at center (C) gold textured shot glass at center (D) blue glass at center" }, { "from": "gpt", "value": "(A) matte gold glass at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49fc84cec7dc78b4.jpg", "conversations": [ { "from": "human", "value": "\nIs black woolen robe at center to the right of black matte jacket at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, black woolen robe at center is not to the right of black matte jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd6ead69f2f2821f.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte pink fabric hat at upper left is positioned to the right of black satin bonnet at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, matte pink fabric hat at upper left is not on the right side of black satin bonnet at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cea2f95b3cf86621.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the orange matte/soft robe at left? (A) matte yellow robe at center (B) knitted woolen hat at center" }, { "from": "gpt", "value": "(A) matte yellow robe at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4216abc4de07bc45.jpg", "conversations": [ { "from": "human", "value": "\nDoes pink fabric dress at right lie in front of pink fabric dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d704b90defc064f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.291, 0.566) (B) (0.338, 0.755)" }, { "from": "gpt", "value": "(A) (0.291, 0.566)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ccdb5538627156c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown leafy tree at right is positioned to the right of green matte tree at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, brown leafy tree at right is to the right of green matte tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/afb027e196a20386.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) white fluffy smoke at center (B) white matte glider at center" }, { "from": "gpt", "value": "(B) white matte glider at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f6dca823e09b2a5c.jpg", "conversations": [ { "from": "human", "value": "\nIs white satin blouse at center to the left of clear glassware at lower left from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, white satin blouse at center is not on the left side of clear glassware at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b160245b315f161.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the black matte jacket at center from the following options: (A) white cotton t-shirt at left (B) matte black suit at center (C) gray concrete plaza at center (D) light brown leather jacket at right?" }, { "from": "gpt", "value": "(B) matte black suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/426e7c1013e6670f.jpg", "conversations": [ { "from": "human", "value": "\nIs metallic red car at center to the right of shiny white sedan at center-left from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, metallic red car at center is positioned on the right side of shiny white sedan at center-left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a59be664f53ebdd8.jpg", "conversations": [ { "from": "human", "value": "\nIs dark gray shirt at center positioned in front of orange fabric bed at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ecd5fd17e82494a8.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.253, 0.425) (B) (0.876, 0.705)" }, { "from": "gpt", "value": "(A) (0.253, 0.425)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/43a788f49902b610.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) matte black motorcycle at right (B) rusty metal jeep at left" }, { "from": "gpt", "value": "(A) matte black motorcycle at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4cd0093c69a7fce.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) transparent glass canopy at center (B) metallic silver chair at lower center" }, { "from": "gpt", "value": "(A) transparent glass canopy at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c36febc99f43ddc2.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.463, 0.484) (B) (0.302, 0.178)" }, { "from": "gpt", "value": "(B) (0.302, 0.178)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/543d9186d97b8a4e.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) shiny metallic mask at center (B) brown glossy horse at center" }, { "from": "gpt", "value": "(A) shiny metallic mask at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f8b9d7b5bb525c43.jpg", "conversations": [ { "from": "human", "value": "\nIs light gray sweater at center positioned in front of striped shirt at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/55a5bde00fa94c07.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of matte black umbrella at center and matte gray hair at lower center in the image provided, where is matte black umbrella at center located with respect to matte gray hair at lower center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5af443e648f75868.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) black matte shirt at center (B) black matte t-shirt at center" }, { "from": "gpt", "value": "(B) black matte t-shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/17e15100af7ec885.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) brown wooden train track at right (B) brown wooden building at center" }, { "from": "gpt", "value": "(B) brown wooden building at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37988647cdf7c1bc.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.178, 0.381) (B) (0.524, 0.261)" }, { "from": "gpt", "value": "(B) (0.524, 0.261)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fbad0de9d88c364d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue fabric tank top at center is positioned to the right of printed fabric blouse at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find blue fabric tank top at center to the right of printed fabric blouse at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ddfefd606a55287d.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is white fabric person at left located relative to striped sweater at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b2db1e7f40bb366.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the orange glass skyscraper at center from the following options: (A) gray concrete skyscraper at center (B) brown textured building at left (C) white textured building at center (D) dark glass skyscraper at center?" }, { "from": "gpt", "value": "(D) dark glass skyscraper at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dffad77e7b989e59.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of blue liquid water at lower left in reference to green leafy trees at left? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab3b5ba7ef4722ff.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.221, 0.969) (B) (0.895, 0.573) (C) (0.301, 0.641) (D) (0.618, 0.550)" }, { "from": "gpt", "value": "(D) (0.618, 0.550)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c108aa995a11bab9.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.329, 0.447) (B) (0.256, 0.175)" }, { "from": "gpt", "value": "(A) (0.329, 0.447)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9cb06e63c4696176.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.165, 0.906) (B) (0.916, 0.917)" }, { "from": "gpt", "value": "(A) (0.165, 0.906)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88748156b5bf3d8b.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) stainless steel oven at center (B) granite countertop at center (C) light wood/wooden drawer at lower left (D) wooden drawer at lower right" }, { "from": "gpt", "value": "(C) light wood/wooden drawer at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/078d708531c0d88e.jpg", "conversations": [ { "from": "human", "value": "\nIs dark gray t-shirt at center further to the viewer compared to red plastic sign at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82a3db1388007261.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.198, 0.720) (B) (0.911, 0.580)" }, { "from": "gpt", "value": "(A) (0.198, 0.720)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05e6cec85d217959.jpg", "conversations": [ { "from": "human", "value": "\nIs metallic ring at center to the right of black glossy smartphone at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, metallic ring at center is not on the right side of black glossy smartphone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d2b9dd3c7f82a99.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the white matte truck at left? (A) red snowboard at lower right (B) white matte van at center (C) white powdery snow at center" }, { "from": "gpt", "value": "(A) red snowboard at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2645c10ef4406924.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green mossy rock at center is positioned to the right of mossy rock at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find green mossy rock at center to the right of mossy rock at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e776c417dde058f.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown concrete river at center is positioned above brown stone tower at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05dc4a7dc4efdf23.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the gray rough rock at center? Choose among these: (A) black metal fence at left (B) white fluffy snow at center" }, { "from": "gpt", "value": "(B) white fluffy snow at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e046502c42ffdd48.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) green leafy tree at upper right (B) green leafy tree at center (C) smooth bark tree at center" }, { "from": "gpt", "value": "(A) green leafy tree at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/476a241fa4ace16c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green grassy field at lower center is thinner than dark brown hair at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, green grassy field at lower center is not thinner than dark brown hair at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a504978d08b7a60.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) metallic gray car at lower left (B) light yellow wood porch at center" }, { "from": "gpt", "value": "(B) light yellow wood porch at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2da89a2908a465b9.jpg", "conversations": [ { "from": "human", "value": "\nIs striped shirt at lower left bigger than white cotton dress at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, striped shirt at lower left is bigger than white cotton dress at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7f317d0019daaef1.jpg", "conversations": [ { "from": "human", "value": "\nDoes golden-brown bark tree at upper right appear on the left side of white paper sign at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, golden-brown bark tree at upper right is to the left of white paper sign at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86d85657169139c7.jpg", "conversations": [ { "from": "human", "value": "\nIs black fabric dress at right thinner than black paper text at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d4a6887e2f7341e1.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) green leafy tree at right (B) green leafy tree at left (C) green leafy tree at upper right" }, { "from": "gpt", "value": "(A) green leafy tree at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4685962110f08342.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of brown glossy horse at left and brown leather jacket at center in the image provided, where is brown glossy horse at left located with respect to brown leather jacket at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d7c78f5c0093baf1.jpg", "conversations": [ { "from": "human", "value": "\nIs dark gray fabric couch at center to the right of metallic silver lamp at upper right from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, dark gray fabric couch at center is not on the right side of metallic silver lamp at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f4cf644b0b9b9158.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the black matte speaker at upper right? (A) black plastic radio at upper center (B) white matte box at center" }, { "from": "gpt", "value": "(B) white matte box at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1bec7182a95dd904.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) white fleece jacket at center (B) rustic brown rifle at center" }, { "from": "gpt", "value": "(B) rustic brown rifle at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1750dfff76af24b6.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of smooth concrete bridge at center in reference to white smoke at upper center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8611f02e0941a50.jpg", "conversations": [ { "from": "human", "value": "\nIs white paper at center closer to camera compared to denim jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, white paper at center is in front of denim jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cb91003e71a2819e.jpg", "conversations": [ { "from": "human", "value": "\nIs green matte shirt at center thinner than white soft baby at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/48262f22ec10f2f2.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.603, 0.502) (B) (0.888, 0.606) (C) (0.195, 0.620)" }, { "from": "gpt", "value": "(B) (0.888, 0.606)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/76cee32328b10730.jpg", "conversations": [ { "from": "human", "value": "\nDoes greenish-blue polished metal cruise ship at right appear under clear water at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ce497d1658a4efc.jpg", "conversations": [ { "from": "human", "value": "\nDoes black fabric shirt at right appear under dark blue shirt at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ff883002b8bc5d7.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the suede tan blazer at left? Select from: (A) shiny black suit at center (B) satin black tie at left (C) green leafy plant at center" }, { "from": "gpt", "value": "(B) satin black tie at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b28267e0ce7d4004.jpg", "conversations": [ { "from": "human", "value": "\nDoes brick paved alley at center appear over multicolored woven rug at right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba7ffd9d5562fe72.jpg", "conversations": [ { "from": "human", "value": "\nDoes purple satin blazer at center appear over matte red cardigan at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, purple satin blazer at center is not positioned above matte red cardigan at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60d6cc389da8d794.jpg", "conversations": [ { "from": "human", "value": "\nIs gravel path at center smaller than green leafy hedge at center right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, gravel path at center occupies less space than green leafy hedge at center right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/066f5338af525f94.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the matte red and white cake at center? Choose from: (A) white fondant cake at center (B) transparent glass cake stand at center (C) white glossy glass plate at center (D) transparent glass door at center" }, { "from": "gpt", "value": "(B) transparent glass cake stand at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/378cc78af07715d5.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) white matte bandage at center (B) white smooth foot at upper left" }, { "from": "gpt", "value": "(A) white matte bandage at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8539632f6a13118e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if orange jersey at center is positioned to the left of orange fabric shorts at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, orange jersey at center is to the right of orange fabric shorts at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f0a095daf5be3b2.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the smooth tan sand at center? Select from: (A) white t-shirt at upper center (B) denim pants at lower left" }, { "from": "gpt", "value": "(B) denim pants at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c87af3e36e735858.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) matte plastic cage at right (B) fuzzy gray rabbit at center" }, { "from": "gpt", "value": "(A) matte plastic cage at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/74269de6831cfc02.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.256, 0.961) (B) (0.596, 0.567) (C) (0.798, 0.966) (D) (0.401, 0.653)" }, { "from": "gpt", "value": "(A) (0.256, 0.961)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9f09e545c5912c5.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black mandolin at center have a smaller size compared to matte wood flute at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, matte black mandolin at center might be larger than matte wood flute at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc04fa0ebd1821b8.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.403, 0.294) (B) (0.623, 0.925)" }, { "from": "gpt", "value": "(B) (0.623, 0.925)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c0fc26f41f44e1b.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.080, 0.350) (B) (0.813, 0.175) (C) (0.482, 0.220)" }, { "from": "gpt", "value": "(B) (0.813, 0.175)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2244de5e196ab043.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown dirt field at center is positioned to the right of white leather glove at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, brown dirt field at center is to the right of white leather glove at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b5ae58f45b2aa85.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the brown stone tower at upper left? Select from: (A) white stone church at upper right (B) blue matte boat at lower right (C) dark blue water at center" }, { "from": "gpt", "value": "(C) dark blue water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2a870511ba84b380.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.734, 0.647) (B) (0.698, 0.331) (C) (0.879, 0.731) (D) (0.476, 0.622)" }, { "from": "gpt", "value": "(A) (0.734, 0.647)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6981e886665532f2.jpg", "conversations": [ { "from": "human", "value": "\nWhere is matte blue jacket at center located in relation to white textured shirt at center in the image? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/550c08e47660d510.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dry skin foot at center is smaller than pale skin foot at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, dry skin foot at center has a smaller size compared to pale skin foot at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e3c60fbc73525060.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.950, 0.578) (B) (0.522, 0.236)" }, { "from": "gpt", "value": "(B) (0.522, 0.236)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a61e2f399db50f7a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.770, 0.581) (B) (0.200, 0.073)" }, { "from": "gpt", "value": "(A) (0.770, 0.581)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b03d4d8937fe463.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) white stone statue at right (B) white marble statue at center, is positioned farthest from the white stone statue at left?" }, { "from": "gpt", "value": "(A) white stone statue at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/13be72db5fe25add.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the black fabric at center? (A) blue knit sweater at lower left (B) black matte jacket at center" }, { "from": "gpt", "value": "(B) black matte jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f0e9d8fba20dab5c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.231, 0.305) (B) (0.317, 0.450)" }, { "from": "gpt", "value": "(B) (0.317, 0.450)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe794f2382e0f4fa.jpg", "conversations": [ { "from": "human", "value": "\nDoes red matte tank top at center appear on the right side of black matte yoga pants at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, red matte tank top at center is positioned on the right side of black matte yoga pants at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc80d85b5faacb82.jpg", "conversations": [ { "from": "human", "value": "\nDoes orange matte bench at center appear over orange matte tub at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, orange matte bench at center is not above orange matte tub at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1edd69ccbc5e4f8f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) tomato sauce pasta at lower right (B) striped cotton shirt at left" }, { "from": "gpt", "value": "(A) tomato sauce pasta at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05ce2c6c263b8658.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.265, 0.403) (B) (0.243, 0.069)" }, { "from": "gpt", "value": "(B) (0.243, 0.069)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/038f69576b36a7b5.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white marble column at center is positioned to the left of gray stone column at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, white marble column at center is to the left of gray stone column at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a00fcce4af03405e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the green glossy water at center? Choose among these: (A) green leafy tree at right (B) green leafy tree at center (C) green leafy tree at left" }, { "from": "gpt", "value": "(B) green leafy tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8ec57ef946975f1a.jpg", "conversations": [ { "from": "human", "value": "\nIs matte gray suit at center below dark gray suit at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, matte gray suit at center is below dark gray suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/176541e0ea1c0641.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.399, 0.991) (B) (0.410, 0.212) (C) (0.368, 0.102) (D) (0.467, 0.078)" }, { "from": "gpt", "value": "(C) (0.368, 0.102)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/15e71b34556f1853.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of white cotton shorts at center and matte white shorts at lower left in the image provided, where is white cotton shorts at center located with respect to matte white shorts at lower left? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7249e2558bf3e90b.jpg", "conversations": [ { "from": "human", "value": "\nDoes pink fabric tank top at center appear on the left side of matte pink tank top at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, pink fabric tank top at center is to the left of matte pink tank top at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c8f87dc832a92f9e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if natural wood board at center is positioned to the left of natural wood plank at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, natural wood board at center is to the left of natural wood plank at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a01dcd27b3822a75.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.444, 0.436) (B) (0.794, 0.427)" }, { "from": "gpt", "value": "(B) (0.794, 0.427)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c962e4ad038d612a.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the metallic pole at center? Choose from: (A) brown suede shoe at lower left (B) brown suede shoe at center (C) brown leather shoes at center" }, { "from": "gpt", "value": "(A) brown suede shoe at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/768dd5d9f2cb0752.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) pink matte yoga pants at center (B) matte black tank top at center" }, { "from": "gpt", "value": "(B) matte black tank top at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1633dd5b9b6273dd.jpg", "conversations": [ { "from": "human", "value": "\nIs gray fur kangaroo at center positioned in front of gray fur kangaroo at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34cd7bc96c28432e.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of smooth red cloth at center in reference to black matte fur cat at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3868f094447b1963.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.556, 0.316) (B) (0.503, 0.278)" }, { "from": "gpt", "value": "(A) (0.556, 0.316)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a42d49a8b6769b1.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.046, 0.605) (B) (0.794, 0.911)" }, { "from": "gpt", "value": "(A) (0.046, 0.605)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ee2be3fc15bf59c.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) metallic red accordion at left (B) red knit sweater at center (C) blue knit sweater at left" }, { "from": "gpt", "value": "(B) red knit sweater at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d04cd7241305c116.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white carved wood bench at upper left is wider than smooth white stool at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, white carved wood bench at upper left has a greater width compared to smooth white stool at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/19eeda4edee022b6.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) dark gray jacket at center (B) navy blue jacket at center (C) matte beige jacket at lower left (D) green matte jacket at center" }, { "from": "gpt", "value": "(B) navy blue jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/22dd7231014b5630.jpg", "conversations": [ { "from": "human", "value": "\nIs speckled orange goldfish at center below orange matte goldfish at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc7568c45779416f.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if beige sand at center is thinner than white matte shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, beige sand at center might be wider than white matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1dc4ff271dcdbaae.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black fabric shirt at center is positioned to the left of black fabric jacket at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, black fabric shirt at center is not on the left side of black fabric jacket at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a9b52c926285c87c.jpg", "conversations": [ { "from": "human", "value": "\nIs white powdery snow at lower center wider than beige wood sign at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0692a3520e942f83.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) white matte astronaut at upper center (B) brown matte skull at center (C) black matte skull at center" }, { "from": "gpt", "value": "(A) white matte astronaut at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/592796047271e754.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) black puffy coat at center (B) striped fleece jacket at center" }, { "from": "gpt", "value": "(B) striped fleece jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3def3766cd5b1554.jpg", "conversations": [ { "from": "human", "value": "\nIs glassy reflective building at upper right wider than concrete stairs at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4599a6eed609863f.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.628, 0.298) (B) (0.601, 0.617) (C) (0.115, 0.920) (D) (0.427, 0.619)" }, { "from": "gpt", "value": "(C) (0.115, 0.920)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f2b075482780217c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) black puffer jacket at upper left (B) denim jacket at center (C) dark gray puffer jacket at center, is positioned farthest from the dark gray hoodie at center?" }, { "from": "gpt", "value": "(A) black puffer jacket at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/378c9288c81482c6.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) matte black coat at center (B) teal matte bicycle at center (C) brown suede boot at center" }, { "from": "gpt", "value": "(B) teal matte bicycle at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f717747d744bd74.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) red cotton shirt at left (B) checkered fabric shirt at center (C) brown felt fedora at upper center" }, { "from": "gpt", "value": "(B) checkered fabric shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e5ddcec692e0e12.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black sweater at center have a smaller size compared to white knitted sweater at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, matte black sweater at center is not smaller in size than white knitted sweater at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b21aeb8ffbee483.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if skinny flesh at center is smaller than light brown wood at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/951a122793c9e153.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) white glossy table at lower center (B) translucent plastic bottle at center" }, { "from": "gpt", "value": "(B) translucent plastic bottle at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c56c3221c5281f50.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) tie-dye fabric shirt at center (B) matte orange t-shirt at center" }, { "from": "gpt", "value": "(B) matte orange t-shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/33558a692789c3f1.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) white matte shirt at center (B) smooth bark tree trunk at left" }, { "from": "gpt", "value": "(A) white matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/38da186f5477b858.jpg", "conversations": [ { "from": "human", "value": "\nIs matte red beanie at center bigger than dry skin palm at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, matte red beanie at center might be smaller than dry skin palm at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3684140496407984.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the striped cotton pillow at upper center? Select from: (A) white fluffy cat at right (B) printed cotton baby at left" }, { "from": "gpt", "value": "(A) white fluffy cat at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/037b2391cb426064.jpg", "conversations": [ { "from": "human", "value": "\nIs suede pink yoga mat at center in front of black floral-patterned clutch at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/042dc29b00944984.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black glossy door at center is positioned below shiny red uniform at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, black glossy door at center is above shiny red uniform at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/55685f7028590507.jpg", "conversations": [ { "from": "human", "value": "\nIs gray stone church at center positioned in front of matte blue car at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d01b3bfeca3ec6b.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at center to the right of white smooth waterfall at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, green leafy tree at center is to the right of white smooth waterfall at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f039c0da361923fa.jpg", "conversations": [ { "from": "human", "value": "\nDoes white and brown fur cat at center appear on the left side of fluffy brown cat at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, white and brown fur cat at center is not on the left side of fluffy brown cat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/91ae308817b1dea2.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is yellow wooden wagon wheel at lower center located relative to yellow wood/wooden wheel at lower center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc07ee3d30820c25.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.170, 0.755) (B) (0.726, 0.819) (C) (0.715, 0.764) (D) (0.125, 0.759)" }, { "from": "gpt", "value": "(B) (0.726, 0.819)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb83e82da2fc0a19.jpg", "conversations": [ { "from": "human", "value": "\nIs clear blue water at upper left wider than orange fabric backpack at center right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, clear blue water at upper left is wider than orange fabric backpack at center right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2be406cfd361e588.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at upper center appear on the right side of white woolen goat at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, green leafy tree at upper center is to the right of white woolen goat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ac781ccddef8edc7.jpg", "conversations": [ { "from": "human", "value": "\nDoes printed fabric headscarf at center appear under white paper umbrella at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, printed fabric headscarf at center is located below white paper umbrella at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73195ab99b9b9ac5.jpg", "conversations": [ { "from": "human", "value": "\nDoes white knitted shawl at center appear under red and white painted metal tower at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, white knitted shawl at center is located below red and white painted metal tower at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3af7fe7a20f21701.jpg", "conversations": [ { "from": "human", "value": "\nIs gray furry monkey at center wider than gray fur monkey at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, gray furry monkey at center has a greater width compared to gray fur monkey at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29cd97b5de31d220.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of gold/gilded wood painting at upper right in reference to orange cotton shirt at lower right? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e26fabc320c4b5da.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if light blue t-shirt at center is thinner than faded denim jacket at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, light blue t-shirt at center is not thinner than faded denim jacket at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e17ee57f0e3cb8f.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte bicycle at center in front of black fabric strap at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, white matte bicycle at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/708da944d9bfc98d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if concrete building at center is bigger than black glass building at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a59452497996a35.jpg", "conversations": [ { "from": "human", "value": "\nDoes white smooth concrete at center have a smaller size compared to white matte shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9a7bbb329fe0b253.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.491, 0.222) (B) (0.856, 0.753)" }, { "from": "gpt", "value": "(A) (0.491, 0.222)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b98971aa3d26a46.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth stone hill at upper center thinner than brown stone town at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, smooth stone hill at upper center's width is not less than brown stone town at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b154e7f4102443f2.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.815, 0.970) (B) (0.311, 0.848)" }, { "from": "gpt", "value": "(A) (0.815, 0.970)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44bd687793905742.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the camouflage uniform at center? Choose among these: (A) black suit at left (B) camo fabric hat at right" }, { "from": "gpt", "value": "(B) camo fabric hat at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44daa6f3eda6130d.jpg", "conversations": [ { "from": "human", "value": "\nWhere is brown textured dirt at center located in relation to yellow matte trailer truck at upper right in the image? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e3c699db234ea251.jpg", "conversations": [ { "from": "human", "value": "\nIs black metallic microphone at center above silver metallic microphone at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, black metallic microphone at center is not positioned above silver metallic microphone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/358f53d730f2a6c9.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) stone castle at center (B) green stone tower at center" }, { "from": "gpt", "value": "(A) stone castle at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/888afb2b3992c975.jpg", "conversations": [ { "from": "human", "value": "\nIs brown rough tree at center above pink striped shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, brown rough tree at center is above pink striped shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/825c86da60aca17c.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) blonde hair at upper center (B) orange fleece jacket at upper center" }, { "from": "gpt", "value": "(A) blonde hair at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/93f938b10491a784.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.206, 0.134) (B) (0.760, 0.459) (C) (0.408, 0.522) (D) (0.397, 0.589)" }, { "from": "gpt", "value": "(C) (0.408, 0.522)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d28009d97cefc025.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if fuzzy white stuffed animal at center is positioned below bread-like at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, fuzzy white stuffed animal at center is positioned under bread-like at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b58eeacf1c66b331.jpg", "conversations": [ { "from": "human", "value": "\nIs brown wood cabin at left in front of brown wood hut at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/441df47fd8f81eac.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black matte water at center is positioned below smooth beige swimsuit at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, black matte water at center is located below smooth beige swimsuit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02ce53a01e3615e7.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) leather-like textured drum at lower right (B) blue fabric top at upper center (C) transparent glass jug at center (D) leather drum at lower right" }, { "from": "gpt", "value": "(B) blue fabric top at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f88785f3dfc82ca0.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.949, 0.767) (B) (0.343, 0.936) (C) (0.874, 0.964)" }, { "from": "gpt", "value": "(A) (0.949, 0.767)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/489d69ae8fc2791f.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the dark gray jacket at right? Select from: (A) dark blue jacket at left (B) black matte jacket at center" }, { "from": "gpt", "value": "(B) black matte jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5627f83be8f9480e.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of matte black backpack at center in relation to shiny red mountain bike at right? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6624ad4bd74b556d.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) white cotton pillow at right (B) brown fuzzy dog at left" }, { "from": "gpt", "value": "(B) brown fuzzy dog at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c24dd3f97cad92f0.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) black matte puffin at lower left (B) matte black puffin at lower left (C) white-feathered puffin at center (D) white fluffy puffin at center" }, { "from": "gpt", "value": "(C) white-feathered puffin at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2a5789aee07666d3.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of green leafy willow at upper center less distant than that of black fabric jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, green leafy willow at upper center is in front of black fabric jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/308aeab134da7e39.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.449, 0.464) (B) (0.322, 0.445)" }, { "from": "gpt", "value": "(B) (0.322, 0.445)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95664c6d08d25b4c.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the matte black tank top at left from the following options: (A) shiny blue sweater at center (B) light blue metallic guitar at right (C) matte brown ukulele at left?" }, { "from": "gpt", "value": "(C) matte brown ukulele at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c6fbf6df4f578675.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.214, 0.478) (B) (0.695, 0.661) (C) (0.124, 0.839)" }, { "from": "gpt", "value": "(C) (0.124, 0.839)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/adc442b15ad22ba9.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the white matte laptop at center? Choose from: (A) matte black hair at center (B) blue fabric table at center (C) silver metallic laptop at center" }, { "from": "gpt", "value": "(C) silver metallic laptop at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e633f777f537c08.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white sheer curtain at left is smaller than translucent fabric curtain at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, white sheer curtain at left is not smaller in size than translucent fabric curtain at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73adfd8ab73580e5.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.774, 0.444) (B) (0.348, 0.616) (C) (0.422, 0.222)" }, { "from": "gpt", "value": "(A) (0.774, 0.444)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cb2289e9058e5610.jpg", "conversations": [ { "from": "human", "value": "\nIs white cotton blazer at center to the left of black textured blazer at left from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white cotton blazer at center is not to the left of black textured blazer at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/627c8a1d1a7c32b8.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown sandy dirt field at lower left is positioned above brown/wooden power lines at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, brown sandy dirt field at lower left is not positioned above brown/wooden power lines at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0814518546bb8d05.jpg", "conversations": [ { "from": "human", "value": "\nIs light brown woolen robe at center further to the viewer compared to yellow fabric turban at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d314a309e16af26e.jpg", "conversations": [ { "from": "human", "value": "\nIs metallic red station wagon at right above purple fabric coat at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, metallic red station wagon at right is not above purple fabric coat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1fb9919d55c596a0.jpg", "conversations": [ { "from": "human", "value": "\nDoes white smooth bell tower at center appear under white stone cross at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3db6bd7fdafde800.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) khaki cotton pants at center (B) striped cotton shirt at center" }, { "from": "gpt", "value": "(A) khaki cotton pants at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c628d5ad3055812f.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte shirt at center bigger than black and white speckled feathered chicken at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, white matte shirt at center is larger in size than black and white speckled feathered chicken at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/201e27417789afc7.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) brown matte shirt at lower right (B) concrete at upper center (C) dark gray suit at center" }, { "from": "gpt", "value": "(B) concrete at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf123ab960612496.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.951, 0.217) (B) (0.878, 0.614)" }, { "from": "gpt", "value": "(B) (0.878, 0.614)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/38da9f342fb640c6.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) red dotted tie at center (B) polka dot tie at center (C) translucent glass drink at center" }, { "from": "gpt", "value": "(A) red dotted tie at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/25a077fc781bd353.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black harness at center lie behind blue rubber goggles at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, matte black harness at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a285640fb01f0069.jpg", "conversations": [ { "from": "human", "value": "\nDoes thatched straw hut at right appear under blue fleece jacket at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, thatched straw hut at right is not below blue fleece jacket at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a5354d016a2b4cd.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of green woven dress at center more distant than that of brown rough tree trunk at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is behind brown rough tree trunk at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/695ac09c2c769b87.jpg", "conversations": [ { "from": "human", "value": "\nIs green textured tree at center smaller than green leafy tree at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, green textured tree at center is not smaller in size than green leafy tree at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1f3527c04554de7.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) blue/yellow striped hurdle at center (B) brown glossy horse at center" }, { "from": "gpt", "value": "(B) brown glossy horse at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7cae15f06f6973d5.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of silver metallic truck at right in reference to light blue metallic truck at right? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a1c045388d51e8f.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny black car at center further to camera compared to shiny red car at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is in front of shiny red car at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/822e839bde2e993f.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the white matte insect at center? Choose among these: (A) translucent white insect at upper right (B) white matte insect at lower left" }, { "from": "gpt", "value": "(A) translucent white insect at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/69f66a2d6cab4e56.jpg", "conversations": [ { "from": "human", "value": "\nIs glossy dark blue car at center further to camera compared to shiny black car at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is in front of shiny black car at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/62abc220e998a000.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of green grass at center and green metallic pole at center in the image provided, where is green grass at center located with respect to green metallic pole at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f29a1a5ac8891c41.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at right to the left of clear water at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, green leafy tree at right is to the right of clear water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8519b676055aec1c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.278, 0.775) (B) (0.347, 0.667)" }, { "from": "gpt", "value": "(B) (0.347, 0.667)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4befd83205a14bfe.jpg", "conversations": [ { "from": "human", "value": "\nDoes rusty metal hut at center have a greater width compared to brown wooden fence at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of rusty metal hut at center exceeds that of brown wooden fence at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a8d754a2811a71b.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the white shirt at center? (A) light blue jeans at center (B) brown canvas bag at center" }, { "from": "gpt", "value": "(A) light blue jeans at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c054db20754944d6.jpg", "conversations": [ { "from": "human", "value": "\nIs white cotton t-shirt at right further to the viewer compared to brown matte hair at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4590e061f94ee0aa.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte wood barn at right is wider than green leafy tree at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82b33e8bc83250bf.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the gray fabric shirt at right? (A) green plastic table at center (B) blue plaid shirt at center (C) black matte jacket at center" }, { "from": "gpt", "value": "(C) black matte jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95cc7cc20a8c2484.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) green ivy-covered pole at right (B) black asphalt road at center" }, { "from": "gpt", "value": "(A) green ivy-covered pole at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46f7c5d92b3952a4.jpg", "conversations": [ { "from": "human", "value": "\nIs dark gray shirt at left smaller than blue shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, dark gray shirt at left is not smaller in size than blue shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d8b648a97b80734.jpg", "conversations": [ { "from": "human", "value": "\nIs green striped pants at left positioned before brown furry boots at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9cee4aacece2f961.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) green leafy palm tree at right (B) wooden bench at lower center (C) green leafy tree at left (D) green translucent water at center" }, { "from": "gpt", "value": "(A) green leafy palm tree at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c8f044fda434b7d5.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of green matte shirt at upper center in relation to yellow matte figure at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8022e1fdbde9735d.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.193, 0.445) (B) (0.259, 0.384)" }, { "from": "gpt", "value": "(A) (0.193, 0.445)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0248a1f326924faf.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) denim pants at center (B) camouflage fabric hazmat suit at center" }, { "from": "gpt", "value": "(B) camouflage fabric hazmat suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/981947273c10c355.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte brown guitar at center have a greater width compared to denim pants at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/387009aedee2ba04.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the blue fabric shirt at center? (A) matte blue blouse at left (B) matte black shirt at upper left" }, { "from": "gpt", "value": "(A) matte blue blouse at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a45e14ad4c670b8f.jpg", "conversations": [ { "from": "human", "value": "\nIs gray matte skull at center thinner than gray fleece jacket at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d82226fc2ecb4b71.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.376, 0.681) (B) (0.234, 0.620) (C) (0.151, 0.713) (D) (0.433, 0.652)" }, { "from": "gpt", "value": "(C) (0.151, 0.713)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b840967cd7b13174.jpg", "conversations": [ { "from": "human", "value": "\nWhere is blue matte sign at left located in relation to black matte coat at lower right in the image? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1807dbe977a8f285.jpg", "conversations": [ { "from": "human", "value": "\nDoes white bark tree trunk at center have a greater width compared to brown rough bark tree trunk at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, white bark tree trunk at center's width does not surpass brown rough bark tree trunk at left's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b8fa5851a89b03f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.497, 0.323) (B) (0.767, 0.912)" }, { "from": "gpt", "value": "(A) (0.497, 0.323)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/43c13c035fd28e4c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if bronze statue at center is positioned to the right of dark gray stone carving at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, bronze statue at center is not to the right of dark gray stone carving at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cab8ee961103da8a.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the matte black car at center? (A) matte white sign at center (B) white plastic license plate at center (C) yellow plastic license plate at center (D) shiny red car at center" }, { "from": "gpt", "value": "(A) matte white sign at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/007f06d9b2ed21bc.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.389, 0.747) (B) (0.402, 0.580) (C) (0.309, 0.923)" }, { "from": "gpt", "value": "(C) (0.309, 0.923)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d884f4322e6c010.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the matte blue car at center? Choose among these: (A) matte black car at lower left (B) white plastic license plate at center" }, { "from": "gpt", "value": "(A) matte black car at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc0f381232282770.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.216, 0.541) (B) (0.093, 0.255)" }, { "from": "gpt", "value": "(B) (0.093, 0.255)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/69828f6bc087f44d.jpg", "conversations": [ { "from": "human", "value": "\nDoes light blue fabric shirt at left come behind black rubber dumbbell at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b57b6ff450a0538.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray wool scarf at left is bigger than black matte jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, gray wool scarf at left is larger in size than black matte jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2086eeee8da419ac.jpg", "conversations": [ { "from": "human", "value": "\nIs silver metallic car at center above satin silver car at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, silver metallic car at center is positioned over satin silver car at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/798ab7cf80613a6d.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny brown bear at upper center further to the viewer compared to matte green shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/346972e28da362ea.jpg", "conversations": [ { "from": "human", "value": "\nDoes black mesh leggings at center have a larger size compared to green mesh running shoe at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, black mesh leggings at center is bigger than green mesh running shoe at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e3ab1f8d8d03e7e4.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green leafy tree at center located in relation to green textured tree at right in the image? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e832f0125fc391ac.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the white fluffy lamb at center? Select from: (A) white fluffy lamb at right (B) white woolen sheep at upper left" }, { "from": "gpt", "value": "(B) white woolen sheep at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c464192ae128cf69.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) patterned fabric dress at lower center (B) green fabric dress at center (C) light brown leather jacket at center (D) light blue jeans at center" }, { "from": "gpt", "value": "(A) patterned fabric dress at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/35aeb85d03015c22.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if shiny blue bicycle at right is bigger than matte black backpack at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4df79009b2ca5a9.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if wet skin baby at center is smaller than glistening skin at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, wet skin baby at center is not smaller than glistening skin at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f271914e6e5afb8b.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the orange fabric life jacket at center? Choose among these: (A) gray rubber tube at center (B) orange life vest at center" }, { "from": "gpt", "value": "(B) orange life vest at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf1a38f4201c2e2b.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray textured suit at center appear on the left side of black leather jacket at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, gray textured suit at center is not to the left of black leather jacket at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5c9a943ca3f9b1b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green matte trees at center is smaller than green matte tree at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, green matte trees at center might be larger than green matte tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8ff53b9014075f72.jpg", "conversations": [ { "from": "human", "value": "\nIs metallic silver exhaust hood at upper center closer to the viewer compared to shiny plastic food at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/79521941d2b83458.jpg", "conversations": [ { "from": "human", "value": "\nIs striped cotton polo shirt at center closer to camera compared to matte pink suit at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8214167470808436.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of pink glossy bow at upper center less distant than that of smooth plastic toy at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/11a70b1dcf3e29ee.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) black matte vest at left (B) white uniform at center (C) black tactical vest at center" }, { "from": "gpt", "value": "(B) white uniform at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/117f068bd5b4cb2f.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black plastic keyboard at center is bigger than white plastic keyboard at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, black plastic keyboard at center is bigger than white plastic keyboard at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4573557c956f040.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.303, 0.716) (B) (0.065, 0.719)" }, { "from": "gpt", "value": "(A) (0.303, 0.716)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f0a5d6ac40d1364.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of glossy red train at right less distant than that of metal train track at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, glossy red train at right is in front of metal train track at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/112d5b3581a5e9d6.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the brown cotton shirt at center among (A) green matte shirt at center (B) green matte corn field at center?" }, { "from": "gpt", "value": "(A) green matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/183b3474e95bbb2a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.453, 0.278) (B) (0.459, 0.838) (C) (0.289, 0.781) (D) (0.770, 0.639)" }, { "from": "gpt", "value": "(B) (0.459, 0.838)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a6a53b17b0bb0890.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the matte yellow shirt at center? Choose from: (A) silver metallic trumpet at center (B) purple fabric dress at center (C) gold shiny saxophone at center (D) black matte t-shirt at center" }, { "from": "gpt", "value": "(B) purple fabric dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba7a04482456c34f.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if ruffled pink fabric skirt at center is wider than matte blue fabric skirt at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of ruffled pink fabric skirt at center exceeds that of matte blue fabric skirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/62b5cde965933f12.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte blue uniform at center is thinner than dry matte lips at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, matte blue uniform at center's width is not less than dry matte lips at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95a4c7a218af0402.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black tank top at center is wider than yellow matte bicycle at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte black tank top at center is wider than yellow matte bicycle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a2fc45f2fb9146e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte red baseball uniform at left is positioned above light gray fabric jacket at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, matte red baseball uniform at left is not positioned above light gray fabric jacket at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6119a89ad67ce4ca.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of dark gray suit at center and black checkered tie at lower right in the image provided, where is dark gray suit at center located with respect to black checkered tie at lower right? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f44cd87cf9339f28.jpg", "conversations": [ { "from": "human", "value": "\nIs polished stone column at left bigger than dark fabric at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, polished stone column at left is not bigger than dark fabric at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c9053f8125cd37e.jpg", "conversations": [ { "from": "human", "value": "\nIs white paper at center wider than black shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, white paper at center is wider than black shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06cd561c61187ef6.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.790, 0.473) (B) (0.030, 0.236) (C) (0.095, 0.231) (D) (0.910, 0.309)" }, { "from": "gpt", "value": "(A) (0.790, 0.473)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5f47ad749a7a018.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of green grassy track at center in reference to clear glass window at right? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f28bddccd76b0a02.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of matte silver charm at center more distant than that of pearl-like bone hand at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/645fa8218e75d9f9.jpg", "conversations": [ { "from": "human", "value": "\nIs green fabric flag at left positioned before matte black hand at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9e7837f63acf6c28.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) matte blue shirt at center (B) gray/rough rope at center (C) matte brown backpack at right" }, { "from": "gpt", "value": "(B) gray/rough rope at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e1edf6a76793426e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy palm tree at right is positioned above concrete wall at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, green leafy palm tree at right is located above concrete wall at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00a4636af1578734.jpg", "conversations": [ { "from": "human", "value": "\nIs black textured skirt at center below shiny black suit at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, black textured skirt at center is not positioned below shiny black suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b4b68571099d347.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.672, 0.852) (B) (0.068, 0.936)" }, { "from": "gpt", "value": "(A) (0.672, 0.852)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b6489f10422744bb.jpg", "conversations": [ { "from": "human", "value": "\nIs white smooth building at center to the right of woven fabric pillar at lower center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find white smooth building at center to the right of woven fabric pillar at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce5bcda227f336f6.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of matte black t-shirt at left less distant than that of black plastic glasses at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, matte black t-shirt at left is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a243c42f8b5ec0a.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.911, 0.838) (B) (0.525, 0.506) (C) (0.406, 0.588)" }, { "from": "gpt", "value": "(A) (0.911, 0.838)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e37b6e7601826ce6.jpg", "conversations": [ { "from": "human", "value": "\nDoes smooth skin hand at lower right have a greater width compared to fuzzy fur coat at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, smooth skin hand at lower right is not wider than fuzzy fur coat at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/55d16a70f4dd3ff5.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.215, 0.550) (B) (0.211, 0.492) (C) (0.721, 0.839)" }, { "from": "gpt", "value": "(B) (0.211, 0.492)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c55b99e15e27d61.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.406, 0.286) (B) (0.482, 0.930)" }, { "from": "gpt", "value": "(A) (0.406, 0.286)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b252006064b10e92.jpg", "conversations": [ { "from": "human", "value": "\nDoes white glossy table at center have a greater width compared to black plastic microphone at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, white glossy table at center is wider than black plastic microphone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fa5496379d1a1c1a.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the green grass at lower center? Choose from: (A) brick chimney at center (B) brown brick chimney at upper right" }, { "from": "gpt", "value": "(A) brick chimney at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78f8a2f2dfd941a6.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.152, 0.736) (B) (0.332, 0.589) (C) (0.835, 0.602) (D) (0.385, 0.658)" }, { "from": "gpt", "value": "(B) (0.332, 0.589)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/091120e8fedc742f.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the wooden bench at center from the following options: (A) green leafy tree at center (B) brown textured tree at upper left?" }, { "from": "gpt", "value": "(A) green leafy tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c5d2406d80c24453.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green matte tree at left is positioned below green needle-like at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, green matte tree at left is located below green needle-like at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4ffc5733f9bddc9b.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.059, 0.642) (B) (0.841, 0.536) (C) (0.943, 0.678) (D) (0.498, 0.534)" }, { "from": "gpt", "value": "(B) (0.841, 0.536)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/47bd61e47d28488d.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.506, 0.084) (B) (0.917, 0.414) (C) (0.719, 0.186)" }, { "from": "gpt", "value": "(A) (0.506, 0.084)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3dbc979bd05486a6.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue water at center appear over brown textured mat at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8d79d1a06d163de.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) blue fabric tuk-tuk at center (B) black fabric bag at center (C) dark blue fabric tuk-tuk at center" }, { "from": "gpt", "value": "(A) blue fabric tuk-tuk at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/afc32aa24ac2abdb.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if snowy wooden hut at center is wider than yellow glass streetlight at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, snowy wooden hut at center has a greater width compared to yellow glass streetlight at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c712348b31116e7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white fluffy cloud at upper center is bigger than metallic silver car at bottom right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, white fluffy cloud at upper center is bigger than metallic silver car at bottom right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e66bf679c3259d8.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if navy blue fabric business suit at right is smaller than purple dotted tie at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e7a3331c8c59f8e5.jpg", "conversations": [ { "from": "human", "value": "\nWhere is textured gray tarp at lower left located in relation to pink glossy tower at center in the image? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/42ed83be959cf6a7.jpg", "conversations": [ { "from": "human", "value": "\nIs brown plaid shirt at center wider than wooden smooth paddle at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, brown plaid shirt at center is not wider than wooden smooth paddle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a104b3f62753370.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the concrete textured hole at center? (A) smooth skin face at center (B) blue matte eye at center" }, { "from": "gpt", "value": "(A) smooth skin face at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78f0bb53cd475a38.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) white textured oval at center (B) white glossy fireplace at center (C) clear glass window at left" }, { "from": "gpt", "value": "(A) white textured oval at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8cdaa0925c4aa09f.jpg", "conversations": [ { "from": "human", "value": "\nIs black fabric at center further to the viewer compared to light brown leather jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, black fabric at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba5166d153587fa3.jpg", "conversations": [ { "from": "human", "value": "\nDoes black matte costume at center appear on the right side of velvet black dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find black matte costume at center to the right of velvet black dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58564e96858d6e1a.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass at center wider than matte red jersey at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of green grass at center exceeds that of matte red jersey at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16c66a63ee54f8fb.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) white glossy truck at center (B) green leafy tree at lower left" }, { "from": "gpt", "value": "(A) white glossy truck at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/685196ca69cd4e4f.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the red fabric flag at right among (A) red-white-striped flag at left (B) blue fabric flag at center (C) shiny black uniform at center (D) dark gray wool dress at center?" }, { "from": "gpt", "value": "(A) red-white-striped flag at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/39e42b70466bcf75.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.193, 0.961) (B) (0.675, 0.473) (C) (0.742, 0.211)" }, { "from": "gpt", "value": "(B) (0.675, 0.473)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03f4db537332fe29.jpg", "conversations": [ { "from": "human", "value": "\nIs matte red shirt at lower center further to the viewer compared to wooden chair at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, matte red shirt at lower center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/50589c295546e429.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.842, 0.341) (B) (0.425, 0.256) (C) (0.465, 0.836)" }, { "from": "gpt", "value": "(A) (0.842, 0.341)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e562fdfe330e66a.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the amber liquid glass at lower left? Choose from: (A) gray cotton t-shirt at center (B) matte brown tank top at center (C) clear glass at lower center" }, { "from": "gpt", "value": "(B) matte brown tank top at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc5cb4af98fe82f3.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.062, 0.439) (B) (0.661, 0.786)" }, { "from": "gpt", "value": "(A) (0.062, 0.439)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49c4599c55d8c4b2.jpg", "conversations": [ { "from": "human", "value": "\nIs dark gray stone tower at upper center above smooth stone tower at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ea313cb367c600e.jpg", "conversations": [ { "from": "human", "value": "\nIs pinkish raw meat at center to the left of khaki cargo shorts at upper left from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, pinkish raw meat at center is not on the left side of khaki cargo shorts at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/33c50ac2eba32587.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black fabric strap at left is wider than gold chain necklace at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, the width of black fabric strap at left exceeds that of gold chain necklace at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1f0b69e9ebbbe12.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of smooth brown tree trunk at left in relation to dirt path at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e02a08ddb9725fef.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) matte black coat at center right (B) dark gray hoodie at left (C) matte blue jacket at left" }, { "from": "gpt", "value": "(B) dark gray hoodie at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08ca5d2d8379924f.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) green plastic straw at upper right (B) blue plastic cup at center (C) blue plastic cup at right (D) yellow matte table at center" }, { "from": "gpt", "value": "(D) yellow matte table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9aad8159e56ffde8.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of pink stone church at center and shiny black motorcycle at lower left in the image provided, where is pink stone church at center located with respect to shiny black motorcycle at lower left? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4dea8599765849e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) black matte jacket at center (B) red fleece jacket at lower right (C) matte black jacket at center" }, { "from": "gpt", "value": "(C) matte black jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d715dabec719fdfc.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.121, 0.309) (B) (0.373, 0.434)" }, { "from": "gpt", "value": "(A) (0.121, 0.309)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01f64bc2571a019a.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) white matte shirt at lower left (B) light blue fabric seats at lower left (C) matte gray suit at stage right (D) white shirt at lower left" }, { "from": "gpt", "value": "(A) white matte shirt at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ebcb9597649c2eb7.jpg", "conversations": [ { "from": "human", "value": "\nDoes khaki quilted jacket at right have a lesser width compared to blue matte jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/91b63843ee9d766d.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) blue striped shirt at center (B) red velvet santa at center" }, { "from": "gpt", "value": "(A) blue striped shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70921a4fa413237e.jpg", "conversations": [ { "from": "human", "value": "\nIs white metallic car at center below white glossy car at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, white metallic car at center is below white glossy car at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2ad20fed5cf928f.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) rusty metal rail at center (B) blue matte sailboat at center" }, { "from": "gpt", "value": "(B) blue matte sailboat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b795033c7013d2e8.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at lower left is smaller than green textured tree at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, green leafy tree at lower left occupies less space than green textured tree at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6a465b19f32b5ffc.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.073, 0.886) (B) (0.504, 0.919) (C) (0.321, 0.073)" }, { "from": "gpt", "value": "(A) (0.073, 0.886)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f39024c23741986b.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the blue fabric jacket at center? Select from: (A) purple matte jacket at center (B) matte black snowboard at upper center (C) plaid fabric shirt at center" }, { "from": "gpt", "value": "(A) purple matte jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d288ec3514d0563.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the skinny barefoot at lower left? (A) pink flesh at center (B) matte skin toe at center" }, { "from": "gpt", "value": "(B) matte skin toe at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8cdb0578d741db24.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue fabric cap at lower left is bigger than brown hair at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, blue fabric cap at lower left has a larger size compared to brown hair at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7f1eaf00325883a7.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the blue fabric beach chair at right from the following options: (A) blue glossy pool at center (B) blue fabric beach chair at lower right (C) blue fabric beach chair at lower left?" }, { "from": "gpt", "value": "(B) blue fabric beach chair at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc8874162bc49ef0.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.817, 0.934) (B) (0.447, 0.917) (C) (0.202, 0.795)" }, { "from": "gpt", "value": "(B) (0.447, 0.917)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/017f38077d0deb66.jpg", "conversations": [ { "from": "human", "value": "\nDoes white marble column at upper center appear on the left side of matte black shorts at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, white marble column at upper center is not to the left of matte black shorts at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b27d2b54fef104a3.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) golden fur dog at lower left (B) matte teal jacket at center" }, { "from": "gpt", "value": "(B) matte teal jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ee951ff6d1d4ab64.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) camouflage fabric uniform at right (B) camouflage uniform at center" }, { "from": "gpt", "value": "(A) camouflage fabric uniform at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73c9e6296c463df0.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the smooth concrete walkway at center? Choose among these: (A) rusty metal rail at lower right (B) dark gray pants at lower left" }, { "from": "gpt", "value": "(A) rusty metal rail at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d53193a73f8f024f.jpg", "conversations": [ { "from": "human", "value": "\nIs white marble statue at center bigger than orange plastic laptop at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, white marble statue at center has a larger size compared to orange plastic laptop at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/894a59c1a52df079.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white frothy water at center is positioned to the left of green leafy tree at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white frothy water at center is not to the left of green leafy tree at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd69c3f2beaae4c1.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the brown matte tree trunk at center? (A) smooth gray tree trunk at center (B) smooth gray bark at center" }, { "from": "gpt", "value": "(A) smooth gray tree trunk at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46989b3825cd98cc.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the black printed umbrella at center among (A) black printed fabric umbrella at center (B) black matte umbrella at center (C) white fabric head at left (D) dark blue fabric umbrella at upper right?" }, { "from": "gpt", "value": "(A) black printed fabric umbrella at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c766a5f7cd61f93.jpg", "conversations": [ { "from": "human", "value": "\nIs green needle-like at left smaller than green forested mountain range at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, green needle-like at left occupies less space than green forested mountain range at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/32137cccca8ce0bd.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) green matte shirt at left (B) dark green glossy shells at center" }, { "from": "gpt", "value": "(B) dark green glossy shells at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0590d28d054f0637.jpg", "conversations": [ { "from": "human", "value": "\nIs gray rough rock at center smaller than blue water at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/da5b18af78826dd5.jpg", "conversations": [ { "from": "human", "value": "\nDoes white glossy horse at lower right have a greater width compared to metallic silver car at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, white glossy horse at lower right might be narrower than metallic silver car at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1464594431c8eb9f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.661, 0.375) (B) (0.371, 0.591)" }, { "from": "gpt", "value": "(A) (0.661, 0.375)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bbf956ffac704100.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if smooth sand at lower center is positioned to the right of green leafy tree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, smooth sand at lower center is to the left of green leafy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dbbc445dc5bb3c7c.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of white woolen sheep at left in relation to speckled brown lamb at left? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/635b149a186d3d74.jpg", "conversations": [ { "from": "human", "value": "\nDoes pink tulle skirt at right appear under metallic silver armor at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, pink tulle skirt at right is above metallic silver armor at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ce19c7a54211c53.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white cotton kufi at center is positioned to the left of blue fabric robe at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, white cotton kufi at center is not on the left side of blue fabric robe at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6eb20031faa766a2.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green fabric scarf at center located in relation to shiny brown horse at left in the image? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b3d1cc54cd250b4.jpg", "conversations": [ { "from": "human", "value": "\nDoes shiny gold suit at center have a lesser width compared to shiny gold trench coat at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e28a365df7c10144.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white floral shirt at center is positioned to the right of white lace shirt at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find white floral shirt at center to the right of white lace shirt at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be99fa3929da4022.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte shirt at center have a smaller size compared to matte yellow shirt at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b6ee7ce44ce86c0.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.261, 0.394) (B) (0.503, 0.487)" }, { "from": "gpt", "value": "(A) (0.261, 0.394)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d70c5392d0c433fd.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of black plastic keyboard at left in relation to matte plastic monkey at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77b0af6365f2f50a.jpg", "conversations": [ { "from": "human", "value": "\nWhere is blue fabric jacket at center located in relation to black matte helmet at center in the image? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4c737a7e787f25d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) green textured tree at center (B) matte blue shirt at center (C) black metal pole at right (D) black metal pole at left" }, { "from": "gpt", "value": "(C) black metal pole at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04a899a39f5abfcd.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.871, 0.630) (B) (0.477, 0.263) (C) (0.636, 0.539) (D) (0.865, 0.606)" }, { "from": "gpt", "value": "(B) (0.477, 0.263)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c55621ef95465a83.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.585, 0.853) (B) (0.451, 0.819)" }, { "from": "gpt", "value": "(B) (0.451, 0.819)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/214a40b16ae6b3c0.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass at center bigger than gray matte horse at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green grass at center has a larger size compared to gray matte horse at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b80d82c5f5ff256.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) white silky water at left (B) smooth green water at center (C) clear water at right (D) green liquid water at center" }, { "from": "gpt", "value": "(C) clear water at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/48ce98eeddca65a0.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of black matte t-shirt at center and dark blue sweater at center in the image provided, where is black matte t-shirt at center located with respect to dark blue sweater at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe8e0984fe543ab4.jpg", "conversations": [ { "from": "human", "value": "\nDoes green grass at center come in front of rusty metal cow at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8fe8180c9abf799.jpg", "conversations": [ { "from": "human", "value": "\nDoes clear blue water at center appear over purple hairband at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, clear blue water at center is positioned over purple hairband at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/76af876742a0fb43.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.725, 0.458) (B) (0.742, 0.986) (C) (0.640, 0.442)" }, { "from": "gpt", "value": "(C) (0.640, 0.442)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b358961e7599257a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if yellow matte sign at center is positioned to the right of yellow plastic sign at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, yellow matte sign at center is not to the right of yellow plastic sign at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5bab692ddd6da0c5.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of rustic sandstone arch at right in relation to camouflage shorts at center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1bafaabd77245af6.jpg", "conversations": [ { "from": "human", "value": "\nDoes striped cotton shirt at center appear on the left side of metallic red toy car at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, striped cotton shirt at center is not on the left side of metallic red toy car at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f4144e57a3f09fa.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.101, 0.886) (B) (0.894, 0.530)" }, { "from": "gpt", "value": "(B) (0.894, 0.530)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/034fce09536db2ba.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) blue striped shirt at center (B) purple fleece sweater at center (C) dark green sweater at upper center (D) gray wool scarf at left" }, { "from": "gpt", "value": "(C) dark green sweater at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3676bd40ce091a8a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white marble courtyard at center is positioned to the right of green leafy hedge at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, white marble courtyard at center is positioned on the right side of green leafy hedge at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db86bee81bbc996f.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) light blue shirt at center (B) white fabric at center (C) white clothed bishop at center" }, { "from": "gpt", "value": "(C) white clothed bishop at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a096ab15cf15790d.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of green mossy tree at upper left and green mossy rock at center in the image provided, where is green mossy tree at upper left located with respect to green mossy rock at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/227648e46312c0e3.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue plaid shirt at center is wider than matte blue shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, blue plaid shirt at center has a greater width compared to matte blue shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/18dcf37113df75f9.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of brown rough wood at center in relation to green metallic trailer truck at upper center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1517a103b185c88c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) blue fabric neckband at left (B) golden fur dog at upper right" }, { "from": "gpt", "value": "(A) blue fabric neckband at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/59d435524e0745bf.jpg", "conversations": [ { "from": "human", "value": "\nIs brown fur deer at center positioned at the back of brown velvet antlered buck at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, brown fur deer at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef9efdb2c9f0089d.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) stone church at center (B) brown textured tree at center" }, { "from": "gpt", "value": "(A) stone church at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5be2aa7e0ca42cc7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy mountain at upper left is wider than red cotton shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf6cfa1400d2c3b5.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy hillside at center smaller than white glass building at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b29843c23b9cfe55.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.466, 0.847) (B) (0.288, 0.797) (C) (0.409, 0.863) (D) (0.299, 0.961)" }, { "from": "gpt", "value": "(A) (0.466, 0.847)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00f4703ad75f15c6.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.366, 0.859) (B) (0.742, 0.933)" }, { "from": "gpt", "value": "(A) (0.366, 0.859)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c0db9396e72ec532.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the floral fabric saree at left? Choose among these: (A) white matte shirt at center (B) matte green bag at center" }, { "from": "gpt", "value": "(B) matte green bag at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/76e669e7b33d7338.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.918, 0.613) (B) (0.885, 0.336)" }, { "from": "gpt", "value": "(B) (0.885, 0.336)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/824e6266cb4c78e8.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the matte red jacket at center? Choose among these: (A) matte beige jacket at center (B) red plastic cup at lower center" }, { "from": "gpt", "value": "(B) red plastic cup at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7bf7baa5723a3391.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.196, 0.994) (B) (0.489, 0.941) (C) (0.699, 0.963) (D) (0.432, 0.973)" }, { "from": "gpt", "value": "(C) (0.699, 0.963)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46de1d4098171d54.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown wood sign at lower left is bigger than black fabric jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, brown wood sign at lower left is not bigger than black fabric jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b0d2b536e502578.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) camouflage fabric rifle at left (B) wooden/antique brown rifle at center (C) matte black rifle at left" }, { "from": "gpt", "value": "(B) wooden/antique brown rifle at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ffe293a502a831ad.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) smooth concrete tower at center (B) white concrete tower at center" }, { "from": "gpt", "value": "(B) white concrete tower at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44869b8388d6c5a6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white smooth shirt at center is positioned to the left of black matte shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, white smooth shirt at center is to the left of black matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ad3f869ad15b0602.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black suit at center have a lesser width compared to metallic silver table at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c177e2db6e76e2fe.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.526, 0.902) (B) (0.482, 0.588)" }, { "from": "gpt", "value": "(A) (0.526, 0.902)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cdb7222536e57441.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray fluffy cat at center is wider than velvet beige curtain at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, the width of gray fluffy cat at center exceeds that of velvet beige curtain at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/66a82e4a56b18dd4.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) white plastic sign at upper left (B) white matte sedan at right (C) red matte stop sign at upper left" }, { "from": "gpt", "value": "(A) white plastic sign at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/39cc9278d7bfdd62.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) black asphalt highway at lower center (B) snowy rock mountain at center (C) white ice at center" }, { "from": "gpt", "value": "(B) snowy rock mountain at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab9e441e23e8e0d0.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) green grassy field at center (B) green leafy tree at center" }, { "from": "gpt", "value": "(A) green grassy field at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2a23bebd1bc10cc.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if burgundy silk tie at center is wider than matte black hand at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, burgundy silk tie at center's width does not surpass matte black hand at upper center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f16cb1a2232ad027.jpg", "conversations": [ { "from": "human", "value": "\nIs white cotton shirt at right positioned before matte striped shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is in front of matte striped shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b3e93a65abf8fb46.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) red checkered tablecloth at center (B) white curly hair at center (C) knitted sweater santa at center" }, { "from": "gpt", "value": "(B) white curly hair at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b70edd53bebf8e7a.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) matte blue shirt at center (B) dark brown hair at center (C) pink paper sign at center" }, { "from": "gpt", "value": "(C) pink paper sign at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e27a72ea1c8f634d.jpg", "conversations": [ { "from": "human", "value": "\nDoes dirt path at center appear over orange matte flowers at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, dirt path at center is not above orange matte flowers at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f9ff7e7e3664abad.jpg", "conversations": [ { "from": "human", "value": "\nIs dark blue shirt at center bigger than dark blue jeans at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, dark blue shirt at center is bigger than dark blue jeans at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/40ebff6f0ef3cbf4.jpg", "conversations": [ { "from": "human", "value": "\nDoes transparent glass door at center come in front of white matte door at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, transparent glass door at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/af148f5d59d33d81.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.985, 0.922) (B) (0.103, 0.539)" }, { "from": "gpt", "value": "(A) (0.985, 0.922)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a10ea9190ad45775.jpg", "conversations": [ { "from": "human", "value": "\nDoes metallic gray winglet at upper right appear on the right side of gray metallic boat at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, metallic gray winglet at upper right is to the right of gray metallic boat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f87188fa275128bd.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of shiny silver sedan at center in relation to shiny silver car at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0411a4efd1f53a00.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) green leafy tree at center (B) green metallic pole at center (C) green textured tree at left (D) gray concrete sidewalk at center, is positioned farthest from the green matte tree at center?" }, { "from": "gpt", "value": "(A) green leafy tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/61431b6f12dea5b0.jpg", "conversations": [ { "from": "human", "value": "\nDoes white fluffy bear cub at left come in front of white fluffy bear at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c72caf9909b857bf.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the brown soft hoodie at center? Choose among these: (A) light blue t-shirt at left (B) wooden paddle at center" }, { "from": "gpt", "value": "(A) light blue t-shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8543add3f741d1b8.jpg", "conversations": [ { "from": "human", "value": "\nDoes black glossy monitor at center appear under orange wood table at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, black glossy monitor at center is not positioned below orange wood table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8175aa949a179c67.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) snowy white hillside at upper center (B) brown fuzzy deer at lower left (C) brown matte/deer at center (D) brown velvet antlers at upper center" }, { "from": "gpt", "value": "(D) brown velvet antlers at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1eea713628413ec4.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.525, 0.481) (B) (0.425, 0.734)" }, { "from": "gpt", "value": "(B) (0.425, 0.734)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1206db1f02e4ae76.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.251, 0.662) (B) (0.388, 0.433) (C) (0.639, 0.263)" }, { "from": "gpt", "value": "(B) (0.388, 0.433)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1c85f4ad07eabc1.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if stone tower at center is thinner than shiny black sedan at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, stone tower at center might be wider than shiny black sedan at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d5dac217eb6bbdd0.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the clear glass window at upper center from the following options: (A) green glass window at left (B) matte black jackets at center (C) metallic silver shelf at upper right (D) white matte jacket at center?" }, { "from": "gpt", "value": "(A) green glass window at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b847c46006f71c78.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue liquid water at center have a larger size compared to white glossy ferry at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7cde69737d63eefb.jpg", "conversations": [ { "from": "human", "value": "\nDoes gold metallic car at center have a lesser width compared to yellow plastic license plate at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, gold metallic car at center is thinner than yellow plastic license plate at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8269b441f54addf4.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.300, 0.992) (B) (0.438, 0.219)" }, { "from": "gpt", "value": "(A) (0.300, 0.992)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5214a5d928831c2e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.727, 0.458) (B) (0.661, 0.688)" }, { "from": "gpt", "value": "(B) (0.661, 0.688)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/adf7215fdb7021cf.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the blue metallic pole at center? Select from: (A) matte blue dress at center (B) striped cotton shirt at center" }, { "from": "gpt", "value": "(A) matte blue dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0c6e28e7eeae8dfa.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte gray blazer at left is wider than white matte blazer at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, matte gray blazer at left's width does not surpass white matte blazer at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2bf8735e6733c6a0.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.140, 0.752) (B) (0.804, 0.731)" }, { "from": "gpt", "value": "(A) (0.140, 0.752)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0068e04a4b593dba.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the silvery metallic boat at lower right among (A) smooth water at lower center (B) metallic gray ship at lower right (C) white glossy boat at lower right?" }, { "from": "gpt", "value": "(C) white glossy boat at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5ed3889c63304a77.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if transparent water at center is positioned above light brown fabric shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, transparent water at center is not above light brown fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/52335d97dbe1e209.jpg", "conversations": [ { "from": "human", "value": "\nDoes teal satin dress at center have a lesser width compared to white textured barong at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, teal satin dress at center is thinner than white textured barong at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88669d469d5573a5.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) plaid shirt at center (B) gray matte umbrella at lower center (C) white shirt at center (D) white cotton shirt at center, is positioned farthest from the light blonde hair at center?" }, { "from": "gpt", "value": "(B) gray matte umbrella at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/50763a50427e1e24.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the green leafy tree at lower left among (A) yellow metallic crane at center (B) green leafy tree at upper right?" }, { "from": "gpt", "value": "(B) green leafy tree at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02f039b794a802f0.jpg", "conversations": [ { "from": "human", "value": "\nWhere is brown wood tree at center located in relation to black fur bear at center in the image? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2188e5ec679f8eb7.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.930, 0.450) (B) (0.720, 0.528) (C) (0.032, 0.838) (D) (0.385, 0.978)" }, { "from": "gpt", "value": "(B) (0.720, 0.528)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2bafad17ff8ffee9.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte helmet at center in front of white matte uniform at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85296b117b70abc9.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark brown leather jacket at lower left is positioned below dark gray fabric jacket at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/384d325b14faa328.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) maroon wooden table at center (B) maroon plastic scrabble board at center" }, { "from": "gpt", "value": "(B) maroon plastic scrabble board at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a66bcbac20a2c25.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the black button-up shirt at center among (A) patterned scarf at lower left (B) dark gray suit at center (C) white plastic table at lower center (D) red cotton shirt at right?" }, { "from": "gpt", "value": "(A) patterned scarf at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a096ee839b575b9.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the gray cobblestone at center among (A) shiny silver car at lower left (B) silver metallic van at lower left?" }, { "from": "gpt", "value": "(A) shiny silver car at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e1016c89685bc258.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the white paper at upper right? Choose among these: (A) blue plaid shirt at lower right (B) dark brown suede jacket at left" }, { "from": "gpt", "value": "(B) dark brown suede jacket at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ae9f7c2c8b746d96.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white fleece jacket at right is positioned below gray fabric chair at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, white fleece jacket at right is above gray fabric chair at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/926ec5baabe6b6c3.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of translucent glass pitcher at center in reference to wooden tray at lower left? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/25562c8127102ff1.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) white glossy water at center (B) shiny red car at center" }, { "from": "gpt", "value": "(A) white glossy water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02619c2146c157e2.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) black satin suit at center (B) pearl/sparkly necklace at center (C) white lace wedding dress at center" }, { "from": "gpt", "value": "(A) black satin suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/56f4fb41de9f5032.jpg", "conversations": [ { "from": "human", "value": "\nDoes transparent wooden boat at center have a larger size compared to matte blue shorts at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, transparent wooden boat at center is bigger than matte blue shorts at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/904f0394a63863c0.jpg", "conversations": [ { "from": "human", "value": "\nDoes black matte shirt at center have a larger size compared to black matte shirt at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, black matte shirt at center is larger in size than black matte shirt at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f8fface8d63c3410.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) smooth skin foot at lower center (B) skin tone bare feet at center (C) light skin tone foot at lower center (D) dark brown sand at center" }, { "from": "gpt", "value": "(B) skin tone bare feet at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bfe6af50f39d4918.jpg", "conversations": [ { "from": "human", "value": "\nWhere is matte orange uniform at left located in relation to black matte referee flag at left in the image? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/944274fbb8388dee.jpg", "conversations": [ { "from": "human", "value": "\nIs glossy metallic water at center wider than silver reflective statue at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/da288e3e470691a6.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) matte black loincloth at center (B) brown leather drum at center (C) red striped cloth at center" }, { "from": "gpt", "value": "(A) matte black loincloth at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/83cb83881aa788cc.jpg", "conversations": [ { "from": "human", "value": "\nIs frosted glass screen door at center smaller than satin glass screen door at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/80093a0e6037816f.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black shirt at left below teal cotton shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, matte black shirt at left is above teal cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f58961fc39edd171.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green textured tree at center is positioned below concrete sidewalk at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, green textured tree at center is above concrete sidewalk at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df031a711da8ef19.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the abstract painting at center? Select from: (A) plaid shirt at left (B) multicolored mosaic portrait at center" }, { "from": "gpt", "value": "(A) plaid shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3828602b85064d58.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if striped cotton shirt at center is wider than purple glittery tiara at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0fe818cdf2b01a02.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) gray matte shirt at center (B) silver metallic laptop at center (C) black glossy tv at upper center" }, { "from": "gpt", "value": "(B) silver metallic laptop at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bada18472f43fc87.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.454, 0.197) (B) (0.511, 0.711) (C) (0.312, 0.230)" }, { "from": "gpt", "value": "(C) (0.312, 0.230)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f364b088e3692e35.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.340, 0.658) (B) (0.986, 0.028)" }, { "from": "gpt", "value": "(B) (0.986, 0.028)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03e5c4c72f238afb.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if printed fabric basket at center is smaller than light gray shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8ef23f69ab834666.jpg", "conversations": [ { "from": "human", "value": "\nIs speckled orange fish at upper left in front of white glossy fish at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5319bbfce0cd4563.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) white grass at upper center (B) green grass at lower center" }, { "from": "gpt", "value": "(B) green grass at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ded073c43e986b60.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.248, 0.287) (B) (0.262, 0.803)" }, { "from": "gpt", "value": "(B) (0.262, 0.803)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b2493e5b7e12bf82.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden table at center behind matte black monitor at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is in front of matte black monitor at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d4d057899d4b89e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) matte wood cabin at center (B) green shingles at upper center" }, { "from": "gpt", "value": "(A) matte wood cabin at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5840b0253932ae9.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) dark gray cloud at upper center (B) snowy granite mountain range at upper center" }, { "from": "gpt", "value": "(A) dark gray cloud at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5f2fa9bae244f272.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte red jacket at center is bigger than matte plastic cups at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, matte red jacket at center is larger in size than matte plastic cups at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eaccf544c208ca10.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black matte shirt at center is positioned to the right of white matte tank top at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find black matte shirt at center to the right of white matte tank top at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f4bf98c59202f8d7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if silver metallic car at center is bigger than pink matte shirt at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, silver metallic car at center is not larger than pink matte shirt at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/af5dd34f9c9158a1.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) white matte rail at center (B) green textured mountain at upper left" }, { "from": "gpt", "value": "(B) green textured mountain at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c588fd64d9b815e9.jpg", "conversations": [ { "from": "human", "value": "\nDoes white marble statue at center have a lesser width compared to smooth white blouse at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/197842d86d28eb1a.jpg", "conversations": [ { "from": "human", "value": "\nIs white striped shirt at left further to the viewer compared to black matte shirt at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7355cb7ee3a7901c.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is white concrete blocks at lower center located relative to concrete column at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02480fd21d5638bf.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte canvas tent at left is thinner than white canvas tent at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, matte canvas tent at left is not thinner than white canvas tent at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d5d73fbbaaf02fdd.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of white cotton shirt at center in relation to blue fleece jacket at center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4bcd5303f60876ce.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black laptop at center come behind silver metallic laptop at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b4a6037c198b183.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) concrete at center (B) concrete/steps at lower right (C) smooth concrete stairs at lower right" }, { "from": "gpt", "value": "(C) smooth concrete stairs at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dcad8a0fd298a136.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) orange matte boat at upper right (B) white concrete dock at lower left" }, { "from": "gpt", "value": "(B) white concrete dock at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58308f23fb7da5af.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.355, 0.402) (B) (0.812, 0.577) (C) (0.597, 0.533)" }, { "from": "gpt", "value": "(A) (0.355, 0.402)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d32c1ca0615b9e1.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if light brown fur at upper right is smaller than pink leather collar at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a9c80bebe065c042.jpg", "conversations": [ { "from": "human", "value": "\nIs white leather jacket at center positioned before white shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is in front of white shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1dbca56b81ef8215.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) green leafy tree at center (B) green leafy tree at upper center" }, { "from": "gpt", "value": "(A) green leafy tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9e15d69a5ad8fa18.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the blue smooth water at lower center? Choose from: (A) gray stone wall at center (B) green leafy tree at upper center" }, { "from": "gpt", "value": "(B) green leafy tree at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/015a133409205a45.jpg", "conversations": [ { "from": "human", "value": "\nIs white fabric tent at upper center smaller than embroidered cotton dress at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, white fabric tent at upper center might be larger than embroidered cotton dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f0a362abf896cb79.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) shiny glass skyscraper at right (B) reflective glass building at left" }, { "from": "gpt", "value": "(A) shiny glass skyscraper at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49f1728bd766c92b.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the black suit at center from the following options: (A) dark blue suit at center (B) black matte camera at center?" }, { "from": "gpt", "value": "(B) black matte camera at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/35d57fa05747418d.jpg", "conversations": [ { "from": "human", "value": "\nDoes black robe at left have a larger size compared to white paper text at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, black robe at left is bigger than white paper text at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c88bab19e2bb6385.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) translucent glass beer at lower left (B) shiny black hat at center" }, { "from": "gpt", "value": "(B) shiny black hat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/becd45879a570e66.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) shiny glass skyscraper at left (B) silver reflective glass building at center" }, { "from": "gpt", "value": "(A) shiny glass skyscraper at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03ac6c8a0f76edd8.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of white blinds at center more distant than that of white smooth dog at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, white blinds at center is further from the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/343f0b2e0848f624.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark gray striped shirt at center is positioned above black matte tank top at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, dark gray striped shirt at center is above black matte tank top at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6169f08dab3715ea.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.516, 0.669) (B) (0.126, 0.483) (C) (0.610, 0.494)" }, { "from": "gpt", "value": "(B) (0.126, 0.483)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f21b7b2ea3426976.jpg", "conversations": [ { "from": "human", "value": "\nDoes white glossy cruise ship at upper left come behind white glossy boat at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is behind white glossy boat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b44bf312af18e67f.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.598, 0.417) (B) (0.762, 0.344)" }, { "from": "gpt", "value": "(B) (0.762, 0.344)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04b39297c4bd36fe.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green grass at lower center is positioned to the right of wooden bench at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green grass at lower center is positioned on the right side of wooden bench at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b180f42d98eeaf74.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white matte food truck at center is positioned to the right of white matte truck at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, white matte food truck at center is to the left of white matte truck at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9bba69281dadda7.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of gray matte sweater at center in reference to matte black hand at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/422ee7ac9435b50c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) black matte jacket at center (B) dark brown leather coat at center" }, { "from": "gpt", "value": "(A) black matte jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1cc03daa2200735a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white smooth dome at center is wider than green leafy tree at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/48ceb525b9c3a42a.jpg", "conversations": [ { "from": "human", "value": "\nIs bare wood tree at center closer to the viewer compared to bare branches at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is behind bare branches at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/138dbaeb2a39ce78.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if rustic wood logs at center is thinner than matte black excavator at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, rustic wood logs at center's width is not less than matte black excavator at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b15794df70444bd4.jpg", "conversations": [ { "from": "human", "value": "\nDoes rough stone hillside at center have a larger size compared to snowy rock at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, rough stone hillside at center is bigger than snowy rock at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3ac6925efffb82dd.jpg", "conversations": [ { "from": "human", "value": "\nDoes red fabric jacket at left come behind light blue ribbed tank top at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/14df215a8e29ac42.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown speckled fur at center have a larger size compared to brown furry goat at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, brown speckled fur at center is not bigger than brown furry goat at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d1c69df05d6e25ba.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) green fabric dress at center (B) dark blue shirt at center (C) velvet black coat at center, is positioned closest to the matte black dress at center?" }, { "from": "gpt", "value": "(C) velvet black coat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e07d86b788e1ab4e.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.391, 0.364) (B) (0.942, 0.787)" }, { "from": "gpt", "value": "(A) (0.391, 0.364)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/41cf4dbed26dbdff.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.248, 0.495) (B) (0.112, 0.334) (C) (0.097, 0.539)" }, { "from": "gpt", "value": "(A) (0.248, 0.495)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0c4bdeb9d5d6f65f.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if metallic silver bicycle at upper center is positioned to the left of shiny black shoe at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, metallic silver bicycle at upper center is to the right of shiny black shoe at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b976a7be573b515a.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) hardcover book at center (B) shiny plastic dice at center (C) matte plastic quest adventure game at center" }, { "from": "gpt", "value": "(B) shiny plastic dice at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2448f625f96a7a90.jpg", "conversations": [ { "from": "human", "value": "\nIs silhouette trees at upper center smaller than dark green leafy trees at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b6a395f0716d69e.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the black cotton shirt at right? (A) gold plastic chair at center (B) light brown plastic chair at lower left (C) dark blue jeans at center (D) white plastic chair at lower left" }, { "from": "gpt", "value": "(B) light brown plastic chair at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f95c6809a2b81774.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) brown reflective water at center (B) brown stone building at center, is positioned farthest from the white marble statue at center?" }, { "from": "gpt", "value": "(A) brown reflective water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/498724cbb0169018.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.832, 0.484) (B) (0.386, 0.469)" }, { "from": "gpt", "value": "(A) (0.832, 0.484)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/20dcae3a03c8702e.jpg", "conversations": [ { "from": "human", "value": "\nIs dark gray t-shirt at center to the left of light gray fabric shirt at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, dark gray t-shirt at center is not to the left of light gray fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/037433fa3873e6be.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of ripe red apple at center more distant than that of matte red apple at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/68ab4518570b4ba4.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.240, 0.878) (B) (0.675, 0.944)" }, { "from": "gpt", "value": "(B) (0.675, 0.944)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d770f04adf7d64eb.jpg", "conversations": [ { "from": "human", "value": "\nDoes green textured mountain range at center have a larger size compared to green spiny cactus at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green textured mountain range at center has a larger size compared to green spiny cactus at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe21e3864ec8c715.jpg", "conversations": [ { "from": "human", "value": "\nIs green smooth water at center positioned behind brown rough rock at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, green smooth water at center is in front of brown rough rock at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3cb0c11439434c34.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) polished stainless steel exhaust hood at center (B) stainless steel oven at center" }, { "from": "gpt", "value": "(A) polished stainless steel exhaust hood at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4f0391f67ba1127.jpg", "conversations": [ { "from": "human", "value": "\nDoes green mossy rock at left appear over green concrete stairs at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green mossy rock at left is positioned over green concrete stairs at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c1ed7358dbb211c0.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is black leather jacket at right located relative to orange protective suit at left? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/195ad31a9a6960e8.jpg", "conversations": [ { "from": "human", "value": "\nIs white swimsuit at upper left wider than smooth skin diver at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of white swimsuit at upper left exceeds that of smooth skin diver at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f80e9f4797c32d35.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black plastic chair at lower right is smaller than dark gray jacket at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ffdad5e044fd46c.jpg", "conversations": [ { "from": "human", "value": "\nIs dead wood tree at center wider than gray textured tree trunk at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, dead wood tree at center has a greater width compared to gray textured tree trunk at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d426a64dd912efbd.jpg", "conversations": [ { "from": "human", "value": "\nIs khaki shorts at center below polka dot fabric dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, khaki shorts at center is below polka dot fabric dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f6fc7fcb085cbb79.jpg", "conversations": [ { "from": "human", "value": "\nDoes transparent plastic bubble at center appear on the left side of matte blue shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, transparent plastic bubble at center is to the right of matte blue shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78701413fa6f1ab0.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.402, 0.283) (B) (0.492, 0.627)" }, { "from": "gpt", "value": "(B) (0.492, 0.627)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8307c7e8c67c9b2c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.020, 0.594) (B) (0.497, 0.628) (C) (0.698, 0.577) (D) (0.303, 0.586)" }, { "from": "gpt", "value": "(B) (0.497, 0.628)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08152bd1308f64be.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the brown fuzzy duck at lower left? Choose from: (A) brown speckled duck at left (B) speckled brown duck at center (C) white downy duck at center (D) brown fuzzy duck at center" }, { "from": "gpt", "value": "(C) white downy duck at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6dbebf5209b7af36.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is clear water at lower center located relative to green leafy tree at lower center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c8d084460a4d07f4.jpg", "conversations": [ { "from": "human", "value": "\nWhere is dark matte head at center located in relation to transparent glass window at left in the image? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca5d2bb2b4fd7ae7.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of green matte shirt at upper center in reference to dark blue uniform at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b4098853173cbb7.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) white cotton shirt at left (B) shiny metallic bicycle at left (C) black glossy dog at lower center (D) blue water at lower right" }, { "from": "gpt", "value": "(C) black glossy dog at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a3079f5480f271c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.961, 0.670) (B) (0.719, 0.850) (C) (0.366, 0.789)" }, { "from": "gpt", "value": "(A) (0.961, 0.670)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e287e99beca12c2.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of teal fabric jacket at center in reference to gray fleece hoodie at left? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e6c2627fb72598a9.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) red matte shirt at center (B) light blue shirt at center (C) green fabric purse at center (D) striped cotton shirt at left" }, { "from": "gpt", "value": "(D) striped cotton shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60d797a403299a12.jpg", "conversations": [ { "from": "human", "value": "\nIs blue wool sweater at center positioned behind black pinstripe suit at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a19ac3d9d3ed4651.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white paper at center is positioned below white shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white paper at center is not positioned below white shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/233790a994e401ed.jpg", "conversations": [ { "from": "human", "value": "\nIs beige fabric sack at center closer to the viewer compared to light blue fabric at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2fa5203f1b10dc5.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) rainbow at upper center (B) clear glass window at center" }, { "from": "gpt", "value": "(A) rainbow at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/96f2d9816196b504.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.589, 0.512) (B) (0.937, 0.738)" }, { "from": "gpt", "value": "(A) (0.589, 0.512)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02e1ebce2c15b57e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the matte red t-shirt at left? Select from: (A) matte black t-shirt at center (B) blue plastic toy at center (C) gray cotton shirt at right (D) matte plastic toy at center" }, { "from": "gpt", "value": "(D) matte plastic toy at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab42797a2caafa58.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.169, 0.411) (B) (0.494, 0.433)" }, { "from": "gpt", "value": "(B) (0.494, 0.433)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed6833a5a1c46620.jpg", "conversations": [ { "from": "human", "value": "\nIs dark brown hair at center further to camera compared to blonde hair at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is in front of blonde hair at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d5c4f308b32ac12.jpg", "conversations": [ { "from": "human", "value": "\nIs clear water at center in front of dark brown leather jacket at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/990acad458db0c95.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray matte shirt at center is positioned to the right of white matte shirt at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find gray matte shirt at center to the right of white matte shirt at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a6aa4dca486b5bbe.jpg", "conversations": [ { "from": "human", "value": "\nIs silver metallic minivan at right behind blue metallic sedan at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f86704b1418a1308.jpg", "conversations": [ { "from": "human", "value": "\nIs white concrete curb at upper center below smooth concrete curb at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, white concrete curb at upper center is above smooth concrete curb at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/08dff07bc7e0ecb8.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) green leafy tree at left (B) green leafy tree at center (C) glistening reflective water at center (D) green leafy tree at right" }, { "from": "gpt", "value": "(B) green leafy tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f7119a7912be4b1.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.515, 0.475) (B) (0.619, 0.433)" }, { "from": "gpt", "value": "(B) (0.619, 0.433)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/184befd4b73ae102.jpg", "conversations": [ { "from": "human", "value": "\nIs light brown fur at center in front of fuzzy brown fox at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, light brown fur at center is behind fuzzy brown fox at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/131180f09b7d4506.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) dark brown leather jacket at upper left (B) blue metallic car at center-right" }, { "from": "gpt", "value": "(A) dark brown leather jacket at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1f7d0de1b4d85f1.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark green textured pine branch at upper left is smaller than white fluffy snow at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, dark green textured pine branch at upper left might be larger than white fluffy snow at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a7515f822a6421e.jpg", "conversations": [ { "from": "human", "value": "\nIs green matte soda bottle at center thinner than translucent glass bottle at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, green matte soda bottle at center's width is not less than translucent glass bottle at right's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/72cc6d7697e0a319.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) brown muddy water at center (B) brown gravel path at right (C) green leafy tree at center" }, { "from": "gpt", "value": "(B) brown gravel path at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec1ac45555c0b6b5.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the blue paper horse at upper left? Select from: (A) white paper horse at center (B) brown glossy horse at upper left" }, { "from": "gpt", "value": "(B) brown glossy horse at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1607f9e5e5bb6df7.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.708, 0.212) (B) (0.206, 0.425) (C) (0.430, 0.189)" }, { "from": "gpt", "value": "(A) (0.708, 0.212)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aca5371d7a4504dd.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black matte glasses at upper left is wider than matte black glasses at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, black matte glasses at upper left is not wider than matte black glasses at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92acdd0196399ad0.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) stone cherub at center (B) stone cherub at upper left (C) gray stone cherub at upper center" }, { "from": "gpt", "value": "(B) stone cherub at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b61b9844a97ae383.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the white fabric lampshade at upper center from the following options: (A) natural wood side table at center (B) white wood bookshelf at upper left (C) natural wood table at center?" }, { "from": "gpt", "value": "(A) natural wood side table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0bdc500f9e90c968.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the matte black chair at lower left among (A) blue matte shirt at center (B) brown fabric chair at center (C) gray matte shirt at center?" }, { "from": "gpt", "value": "(B) brown fabric chair at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1814ba68d994980a.jpg", "conversations": [ { "from": "human", "value": "\nIs velvet black jacket at left thinner than shiny dark glass at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, velvet black jacket at left might be wider than shiny dark glass at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8219eb3a3f1b7785.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the black plastic keyboard at center? Choose from: (A) white matte computer desk at center (B) matte black monitor at center" }, { "from": "gpt", "value": "(B) matte black monitor at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dba1613e98c526fc.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.941, 0.228) (B) (0.638, 0.844)" }, { "from": "gpt", "value": "(A) (0.941, 0.228)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/604acd776d1f9f79.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte red dress at center appear on the right side of green textured christmas tree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, matte red dress at center is positioned on the right side of green textured christmas tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05eb317948f68257.jpg", "conversations": [ { "from": "human", "value": "\nIs black textured coat at center closer to the viewer compared to black woolen coat at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b3a368bfff5c9630.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if fluffy white teddy bear at upper left is bigger than white plush bear at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, fluffy white teddy bear at upper left has a larger size compared to white plush bear at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/170ba49fa36d6af2.jpg", "conversations": [ { "from": "human", "value": "\nDoes textured fabric heart at center have a smaller size compared to polished bronze statue at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, textured fabric heart at center is not smaller in size than polished bronze statue at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a4b130eed019aa6.jpg", "conversations": [ { "from": "human", "value": "\nIs gray concrete wall at left to the left of white matte shirt at lower center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, gray concrete wall at left is to the left of white matte shirt at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d4fdc7c6a0a87d1.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.654, 0.795) (B) (0.028, 0.806) (C) (0.315, 0.970) (D) (0.076, 0.406)" }, { "from": "gpt", "value": "(D) (0.076, 0.406)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7eb7cc432df77387.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the white shirt at upper right among (A) light brown acoustic guitar at center (B) matte white hat at center (C) red cotton shirt at center (D) white matte hat at upper center?" }, { "from": "gpt", "value": "(D) white matte hat at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/757f2c3713f49003.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the black matte speaker at center? (A) smooth white shirt at lower left (B) matte brown jacket at center (C) smooth blue shirt at lower left" }, { "from": "gpt", "value": "(A) smooth white shirt at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/253fbb1d075df095.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.305, 0.720) (B) (0.523, 0.277)" }, { "from": "gpt", "value": "(B) (0.523, 0.277)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/363168e2160947f5.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy ivy at center is positioned to the right of white stone balcony at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, green leafy ivy at center is not to the right of white stone balcony at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/635ed476ff2dfbf6.jpg", "conversations": [ { "from": "human", "value": "\nDoes black fleece jacket at lower left appear under black fleece sweatshirt at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, black fleece jacket at lower left is located below black fleece sweatshirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db811ebc9775464f.jpg", "conversations": [ { "from": "human", "value": "\nIs matte brown building at center to the right of blue water at left from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find matte brown building at center to the right of blue water at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dea0e1cd89a20eeb.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte pot at center closer to the viewer compared to rusty metal pot at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85d198e3fdcc21e4.jpg", "conversations": [ { "from": "human", "value": "\nIs silver glass skyscraper at right to the left of white stone tower at left from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, silver glass skyscraper at right is not to the left of white stone tower at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5f1bdbe6f94c298.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of green matte container ship at center in reference to transparent water at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d4b94560c0d0c5c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.508, 0.164) (B) (0.286, 0.163)" }, { "from": "gpt", "value": "(A) (0.508, 0.164)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/816825c607a6029b.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of white matte shirt at center less distant than that of black matte shirt at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a0cb3a71f2b1c957.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of white knitted scarf at center in relation to gold ornate frame at upper left? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/630616ea082de770.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at center appear under peeling white wood door at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, green leafy tree at center is above peeling white wood door at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/da45fa6b73f35b67.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte window at center further to the viewer compared to white matte shutter at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d1d5857d76088c0.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the camo fabric shirt at left? Choose from: (A) printed fabric skirt at left (B) dark red textured pants at right" }, { "from": "gpt", "value": "(A) printed fabric skirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/704805f16ccb1c27.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.447, 0.566) (B) (0.829, 0.834)" }, { "from": "gpt", "value": "(B) (0.829, 0.834)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3e4607fd28087894.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) black fabric at lower center (B) matte floral dress at center" }, { "from": "gpt", "value": "(A) black fabric at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/67c78c5b1c994681.jpg", "conversations": [ { "from": "human", "value": "\nIs blue paper poster at center further to the viewer compared to matte white shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de9b23e8aac3c925.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if leather shoe at center is thinner than purple knitted sock at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, leather shoe at center might be wider than purple knitted sock at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85312c5a8bf23710.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark brown matte cup at center appear on the right side of dark brown syrup at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, dark brown matte cup at center is to the right of dark brown syrup at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/095b2af602947787.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black dress at center bigger than white shirt at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0208031dda5a2e83.jpg", "conversations": [ { "from": "human", "value": "\nIs clear acrylic robot at center thinner than black rubber wheel at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, clear acrylic robot at center's width is not less than black rubber wheel at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8f5efba63909f11.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the dark stone archway at center? Choose from: (A) red fabric flag at center (B) light beige stone tower at left (C) stone tower at center" }, { "from": "gpt", "value": "(A) red fabric flag at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/76a73e39c1dabbf7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if orange fleece sweatshirt at center is positioned below orange fabric swivel chair at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, orange fleece sweatshirt at center is not below orange fabric swivel chair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7f568fd2b5481d3e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.030, 0.547) (B) (0.617, 0.203) (C) (0.231, 0.684) (D) (0.242, 0.953)" }, { "from": "gpt", "value": "(B) (0.617, 0.203)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db4bab184a6336e2.jpg", "conversations": [ { "from": "human", "value": "\nDoes white paperboard at center appear over silver metallic tripod at center-left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f65ff2cd7435bfc6.jpg", "conversations": [ { "from": "human", "value": "\nIs brown textured dress at center smaller than matte red dress at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, brown textured dress at center is not smaller in size than matte red dress at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bad5bb44098b29e6.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray wool scarf at center lie in front of striped fabric shirt at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is in front of striped fabric shirt at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46e2fb8770ab267b.jpg", "conversations": [ { "from": "human", "value": "\nIs metallic gold sunglasses at center above black matte sunglasses at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, metallic gold sunglasses at center is not above black matte sunglasses at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/326c9721446dafb0.jpg", "conversations": [ { "from": "human", "value": "\nIs matte brown hoodie at center above brown soft sweater at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, matte brown hoodie at center is below brown soft sweater at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6af5912e0a3bd526.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.196, 0.659) (B) (0.296, 0.562) (C) (0.364, 0.397)" }, { "from": "gpt", "value": "(C) (0.364, 0.397)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b94756d8a87b1b95.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.035, 0.752) (B) (0.579, 0.553)" }, { "from": "gpt", "value": "(B) (0.579, 0.553)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/415e7c85d05fbe3d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.268, 0.164) (B) (0.302, 0.805)" }, { "from": "gpt", "value": "(B) (0.302, 0.805)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/185968d1a9589038.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte headscarf at center to the left of smooth skin hand at right from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, black matte headscarf at center is positioned on the left side of smooth skin hand at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b42ac288937c5ac8.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.730, 0.755) (B) (0.251, 0.706) (C) (0.296, 0.583)" }, { "from": "gpt", "value": "(B) (0.251, 0.706)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6226c3f7e727fa76.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte chef hat at upper center thinner than white matte plate at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, white matte chef hat at upper center's width is not less than white matte plate at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b3b8ccce590ca64.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of brown rough skin at center and brown rough branch at upper center in the image provided, where is brown rough skin at center located with respect to brown rough branch at upper center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fca77fa0a732faf0.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) matte black table at lower left (B) translucent plastic cup at center (C) dark blue shirt at left" }, { "from": "gpt", "value": "(B) translucent plastic cup at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/952a3c53b18e4863.jpg", "conversations": [ { "from": "human", "value": "\nIs white cotton shirt at center wider than green grassy bank at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fbea5d7c77312546.jpg", "conversations": [ { "from": "human", "value": "\nDoes shiny metallic jacket at center appear under shiny metallic food at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, shiny metallic jacket at center is not below shiny metallic food at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d619147bb2beecc.jpg", "conversations": [ { "from": "human", "value": "\nDoes beige stone building at center have a lesser width compared to beige concrete building at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, beige stone building at center is not thinner than beige concrete building at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5f75c9474cfdd15.jpg", "conversations": [ { "from": "human", "value": "\nDoes green matte clock at upper center appear on the right side of white glossy clock at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, green matte clock at upper center is not on the right side of white glossy clock at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec5266361debad7f.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) glossy black latex at center (B) shiny black leather pants at center (C) matte black boxing glove at center" }, { "from": "gpt", "value": "(C) matte black boxing glove at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e21d2736855ae05.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white glossy boat at center is positioned above white plastic boat at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white glossy boat at center is not above white plastic boat at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c5778fa6952e1d4.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) smooth black suit at right (B) matte black suit at center (C) matte pink shirt at center (D) shiny red tie at center" }, { "from": "gpt", "value": "(C) matte pink shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/223b56df1a79013a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) vibrant pink shorts at center (B) matte blue shirt at left" }, { "from": "gpt", "value": "(A) vibrant pink shorts at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f1a5e4b3b92ea11.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is clear glass window at lower right located relative to transparent glass window at lower left? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bafde96299eb7318.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte ballerina at center closer to camera compared to matte black leotard at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34599b4b752d0c24.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the clear glass mirror at upper center from the following options: (A) white glossy sink at lower center (B) matte black t-shirt at center?" }, { "from": "gpt", "value": "(A) white glossy sink at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e3a1c014f5dd10a2.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.481, 0.531) (B) (0.865, 0.395) (C) (0.775, 0.914)" }, { "from": "gpt", "value": "(C) (0.775, 0.914)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c0cbf09d6d30c37.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the light beige fabric headscarf at upper left? Select from: (A) white cotton shirt at center (B) white dotted fabric pants at lower left (C) soft gray fabric baby at center (D) orange fabric sandal at lower left" }, { "from": "gpt", "value": "(A) white cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e9eb1710265015a.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of black paper sign at upper center more distant than that of brown curly hair at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, black paper sign at upper center is behind brown curly hair at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/882bd40efd8c3052.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white frothy water at center is thinner than stone bridge at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, white frothy water at center's width is less than stone bridge at upper center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/def2958bd2b9383b.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) matte black shirt at center (B) gray fleece at right (C) white leather hand at center" }, { "from": "gpt", "value": "(C) white leather hand at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/967f584691dd2223.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the gold bangles at left? Choose among these: (A) leather bracelet at left (B) orange-brown fur tiger at center" }, { "from": "gpt", "value": "(B) orange-brown fur tiger at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/51a8b10afadcae26.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) rusty metal barn at center (B) dry grass at center" }, { "from": "gpt", "value": "(B) dry grass at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e9acd942c345e7af.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.708, 0.688) (B) (0.429, 0.627) (C) (0.967, 0.645)" }, { "from": "gpt", "value": "(A) (0.708, 0.688)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f9c790425d9cb7a4.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) black textured portrait at upper center (B) grungy paper poster at center" }, { "from": "gpt", "value": "(B) grungy paper poster at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16139ad1496d7889.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of striped cotton shirt at center and matte gray shirt at lower right in the image provided, where is striped cotton shirt at center located with respect to matte gray shirt at lower right? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37b880d5ae59ea3d.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the smooth wooden table at center? Choose among these: (A) dark brown leather jacket at center (B) yellow matte shirt at left" }, { "from": "gpt", "value": "(A) dark brown leather jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d7e2da8ec4ca6957.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown matte fungi at center appear over brown fuzzy mushroom at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, brown matte fungi at center is located above brown fuzzy mushroom at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4c136308e80152a.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of white matte tissue box at center in relation to white matte moisturizer at center right? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/299b1521f8cb6588.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.178, 0.645) (B) (0.796, 0.691) (C) (0.468, 0.877)" }, { "from": "gpt", "value": "(A) (0.178, 0.645)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/078a4203f3364b06.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the dark gray sweater at center? Select from: (A) matte black car at lower left (B) white matte awning at lower right" }, { "from": "gpt", "value": "(A) matte black car at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef255bea19e59651.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) matte blue shirt at center (B) denim shirt at center (C) blue fabric hairband at lower right" }, { "from": "gpt", "value": "(C) blue fabric hairband at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb7a85dbb36a14d4.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.215, 0.398) (B) (0.511, 0.480) (C) (0.918, 0.303) (D) (0.465, 0.344)" }, { "from": "gpt", "value": "(A) (0.215, 0.398)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a6808a98ea3289c3.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) white matte projection screen at upper center (B) purple floral blouse at center, is positioned closest to the gray cotton t-shirt at left?" }, { "from": "gpt", "value": "(B) purple floral blouse at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e8d07a5431abb67.jpg", "conversations": [ { "from": "human", "value": "\nWhere is dark gray stone ledge at right located in relation to green dome building at center in the image? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/571779bf7035d00f.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at left is positioned to the right of matte brown hat at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, green leafy tree at left is not to the right of matte brown hat at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36e12147efde9f73.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) black plastic sunglasses at center (B) white plastic man at center" }, { "from": "gpt", "value": "(B) white plastic man at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0cae66991219f6e.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) matte black figure at center (B) wooden post at center (C) smooth black hair at center" }, { "from": "gpt", "value": "(C) smooth black hair at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/19d2d02089ecf1ea.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green matte shirt at center located in relation to matte red polo shirt at right in the image? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a5429afc460f2e5.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte red jacket at right is thinner than brushed nylon jacket at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, matte red jacket at right has a lesser width compared to brushed nylon jacket at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/45fdabc018f08566.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.562, 0.161) (B) (0.229, 0.786)" }, { "from": "gpt", "value": "(B) (0.229, 0.786)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/25c6d10d7f71c670.jpg", "conversations": [ { "from": "human", "value": "\nIs brown leather accordion at center further to the viewer compared to wooden floral-patterned accordion at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, brown leather accordion at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/643b33dd7b0bb150.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is black matte shirt at center located relative to white matte bowl at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f35796b752b188bc.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.102, 0.378) (B) (0.724, 0.364)" }, { "from": "gpt", "value": "(A) (0.102, 0.378)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/24b96b1f458c472e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.348, 0.780) (B) (0.645, 0.742) (C) (0.639, 0.848)" }, { "from": "gpt", "value": "(A) (0.348, 0.780)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b142fee52b4bed14.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the smooth skin face at lower left? (A) white cotton shirt at upper center (B) orange striped fur tiger at center" }, { "from": "gpt", "value": "(A) white cotton shirt at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c075bfd32f0b960.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) pink fabric at center (B) dirt path at center" }, { "from": "gpt", "value": "(A) pink fabric at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0eac836953fa495.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) polka dot fabric pants at right (B) metallic silver bowl at center" }, { "from": "gpt", "value": "(A) polka dot fabric pants at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dcfafac7a6d31a2d.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the gray striped shirt at center from the following options: (A) brown hair at lower center (B) metallic silver microphone at upper right (C) black metallic microphone at right (D) blonde hair at lower right?" }, { "from": "gpt", "value": "(A) brown hair at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e922efa938bdc1c1.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.467, 0.470) (B) (0.363, 0.458)" }, { "from": "gpt", "value": "(B) (0.363, 0.458)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f8b077f2470066f.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the blue cotton shirt at center? (A) matte white shirt at center (B) striped fabric ball at center" }, { "from": "gpt", "value": "(B) striped fabric ball at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f1c37ef248e8738.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue striped shirt at right appear over white striped shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, blue striped shirt at right is not positioned above white striped shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/627bb1b7195001da.jpg", "conversations": [ { "from": "human", "value": "\nIs green mossy hedge at upper left to the right of green leafy hedge at upper center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, green mossy hedge at upper left is to the left of green leafy hedge at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29717711fc54bb1a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown fur raccoon at center is thinner than green matte snake at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, brown fur raccoon at center's width is not less than green matte snake at lower left's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e78ac031a06802e0.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) blonde hair at upper right (B) black matte shirt at center" }, { "from": "gpt", "value": "(A) blonde hair at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a31e7bcf59690b89.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) gray concrete pavement at center (B) green leafy tree at upper left (C) brown/dry leaves at upper center, is positioned farthest from the gray concrete block at left?" }, { "from": "gpt", "value": "(B) green leafy tree at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/41aad67da9212d64.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) glossy black sedan at center (B) gray concrete curb at lower left (C) white plastic license plate at center" }, { "from": "gpt", "value": "(C) white plastic license plate at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e2f20171f542d8d.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy palm tree at lower right have a larger size compared to green leafy palm tree at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d35cd50f396deda.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow rubber ball at right positioned in front of yellow plastic bear at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4306643c48734385.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) black plastic clock at center (B) black matte bicycle handlebars at lower right (C) matte black text at left" }, { "from": "gpt", "value": "(B) black matte bicycle handlebars at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c342499c41bf6970.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.087, 0.722) (B) (0.791, 0.237) (C) (0.518, 0.855)" }, { "from": "gpt", "value": "(B) (0.791, 0.237)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e58fe2efc7d1e587.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) white glossy pillar at center (B) white metallic pillar at center" }, { "from": "gpt", "value": "(B) white metallic pillar at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf25a122a94101d3.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of american flag at upper right in reference to polyester flag at upper center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b61f60a6508f18d8.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of black polished wood ship at center in relation to white matte sailboat at right? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4c97e4735e3b46a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.266, 0.811) (B) (0.293, 0.872) (C) (0.983, 0.847) (D) (0.611, 0.745)" }, { "from": "gpt", "value": "(A) (0.266, 0.811)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/41b1f7c1fa6944c8.jpg", "conversations": [ { "from": "human", "value": "\nDoes green metallic sign at left have a larger size compared to black metal sign at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, green metallic sign at left is bigger than black metal sign at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec84928a07be3ba9.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of blue printed shorts at upper left and smooth skin torso at upper left in the image provided, where is blue printed shorts at upper left located with respect to smooth skin torso at upper left? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4934bb909f3614da.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) white wrought iron balcony at center (B) brown muddy water at lower left" }, { "from": "gpt", "value": "(A) white wrought iron balcony at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca86f6d3839995f3.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) green leafy tree at left (B) green leafy tree at center (C) clear water at center" }, { "from": "gpt", "value": "(B) green leafy tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1afdcc27f4271c9.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.847, 0.573) (B) (0.991, 0.566)" }, { "from": "gpt", "value": "(B) (0.991, 0.566)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b3464c5310670540.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white paper at lower right is positioned above metallic red pen at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, white paper at lower right is positioned over metallic red pen at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3de0b3e0d4bca077.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the blue fabric shirt at left? Choose among these: (A) dark blue shirt at center (B) dark gray jacket at left" }, { "from": "gpt", "value": "(A) dark blue shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0c30c6865ebd7e8.jpg", "conversations": [ { "from": "human", "value": "\nIs dark green fabric curtain at upper left positioned behind white paper calendar at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, dark green fabric curtain at upper left is in front of white paper calendar at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e4907f30ced4a9db.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) multicolored fabric crowd at lower center (B) brown fabric pants at center" }, { "from": "gpt", "value": "(B) brown fabric pants at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/116cd5bf6347d869.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of gray wool coat at left in relation to brown matte jacket at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf0d94fbede6e0c9.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.831, 0.939) (B) (0.598, 0.617)" }, { "from": "gpt", "value": "(B) (0.598, 0.617)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9312ccb5052dad36.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white snow at center is thinner than brown/rough tree at center-left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white snow at center's width is not less than brown/rough tree at center-left's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c25bd3251e871209.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if concrete stairs at center is thinner than wooden bench at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c299bedb7e4e2312.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue water at lower center is smaller than brown sandy shoreline at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, blue water at lower center occupies less space than brown sandy shoreline at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/634b1f525d704f81.jpg", "conversations": [ { "from": "human", "value": "\nDoes clear water splash at center appear under matte skin man at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, clear water splash at center is not below matte skin man at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02279aba7e6bc46a.jpg", "conversations": [ { "from": "human", "value": "\nIs dark brown hair at upper center closer to camera compared to brown matte eye at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, dark brown hair at upper center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c6ee9b863cbcd13.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray stone clock tower at center is positioned to the right of green leafy tree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, gray stone clock tower at center is to the right of green leafy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a90bceeec020bb3a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.926, 0.475) (B) (0.347, 0.752)" }, { "from": "gpt", "value": "(A) (0.926, 0.475)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/54162ff1fa1be608.jpg", "conversations": [ { "from": "human", "value": "\nIs brown stone palace at center smaller than green leafy tree at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, brown stone palace at center occupies less space than green leafy tree at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5963a790f277e62c.jpg", "conversations": [ { "from": "human", "value": "\nIs matte gray sedan at right further to camera compared to yellow metallic taxi at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is in front of yellow metallic taxi at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bffbe9d87882cf68.jpg", "conversations": [ { "from": "human", "value": "\nIs white glossy shirt at center thinner than matte black blazer at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white glossy shirt at center is not thinner than matte black blazer at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd2f941b11889d8c.jpg", "conversations": [ { "from": "human", "value": "\nDoes green grassy hillside at upper center have a lesser width compared to white matte boat at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, green grassy hillside at upper center is not thinner than white matte boat at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/edeb0186583f7795.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown leather shoe at center appear under matte brown shoe at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec54aa9493772864.jpg", "conversations": [ { "from": "human", "value": "\nDoes khaki fabric cap at right appear on the right side of beige fabric cap at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, khaki fabric cap at right is not to the right of beige fabric cap at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5506dcf92d365df.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.966, 0.539) (B) (0.689, 0.713) (C) (0.319, 0.327)" }, { "from": "gpt", "value": "(A) (0.966, 0.539)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ca17b18f066c16e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green metallic train at center is thinner than metallic gray tower at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, green metallic train at center's width is less than metallic gray tower at upper center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a0804bac27c17e6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black camo shorts at lower left is positioned to the right of green matte shirt at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, black camo shorts at lower left is to the left of green matte shirt at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b50bdfb7b93487f0.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of polished brass bell tower at upper center in relation to blue painted metal clock at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/720a50cadd6c0290.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the dry skin at center? Choose among these: (A) pale skin foot at center (B) dry skin toe at center" }, { "from": "gpt", "value": "(B) dry skin toe at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/afd770cbe186e0fa.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at left appear on the left side of green leafy tree at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green leafy tree at left is positioned on the left side of green leafy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37fc626df6ea4e00.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) orange matte shorts at right (B) orange matte soccer jersey at center" }, { "from": "gpt", "value": "(B) orange matte soccer jersey at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3bf9882012185bf1.jpg", "conversations": [ { "from": "human", "value": "\nIs fuzzy grass at center to the left of smooth gray stone bench at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find fuzzy grass at center to the left of smooth gray stone bench at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/916e0f44d8444527.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.422, 0.198) (B) (0.187, 0.825)" }, { "from": "gpt", "value": "(B) (0.187, 0.825)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e38a38280c13eba.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the matte red dress at left? Choose from: (A) orange cotton shirt at center (B) silky satin dress at center (C) matte pink fabric dress at center" }, { "from": "gpt", "value": "(B) silky satin dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6cccb9cb4ae88951.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the black plastic table at center? (A) black matte laptop at center (B) black fabric skirt at center (C) black suit at left" }, { "from": "gpt", "value": "(A) black matte laptop at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e00a917ab0c4bf3.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.421, 0.516) (B) (0.184, 0.559) (C) (0.153, 0.897)" }, { "from": "gpt", "value": "(B) (0.184, 0.559)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c15c04ee4d342c76.jpg", "conversations": [ { "from": "human", "value": "\nDoes green fabric apron at center appear under orange shirt at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5715441207e3757.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is light beige pants at center located relative to white striped shirt at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/351d887bba4e88e3.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at center behind green liquid at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4543f3f413b13727.jpg", "conversations": [ { "from": "human", "value": "\nIs green matte bicycle at lower right further to the viewer compared to green apron at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is in front of green apron at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2bfab19045dbcaca.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the white shirt at center? Choose from: (A) yellow paper at upper center (B) white cotton shirt at center (C) matte paper poster at left (D) black suit at left" }, { "from": "gpt", "value": "(C) matte paper poster at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44b82495ab7a1c74.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of green matte tree at center in relation to clear water at lower left? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bcdb162f8431a9b4.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the yellow-green foliage at center from the following options: (A) brown/dried wood tree at right (B) green needle-like at center?" }, { "from": "gpt", "value": "(B) green needle-like at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9320aa9c287009a0.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) matte white shirt at center (B) black matte cape at center" }, { "from": "gpt", "value": "(A) matte white shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9df0fc36f9bbda00.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the matte gray tent at center? Choose from: (A) blue fabric shorts at lower left (B) matte pink tent at center (C) yellow fabric tent at right" }, { "from": "gpt", "value": "(C) yellow fabric tent at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ae8ec45d398fd7da.jpg", "conversations": [ { "from": "human", "value": "\nDoes black fabric shirt at center have a lesser width compared to white plastic table at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, black fabric shirt at center has a lesser width compared to white plastic table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/25f93829d856d4fa.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.525, 0.469) (B) (0.604, 0.533)" }, { "from": "gpt", "value": "(B) (0.604, 0.533)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0034dff0499938b0.jpg", "conversations": [ { "from": "human", "value": "\nDoes smooth bark tree trunk at center appear under smooth gray bark at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, smooth bark tree trunk at center is located below smooth gray bark at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4380c6891a0a7bd0.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the orange clay tiles at upper center? Choose from: (A) light brown stone tower at center (B) metallic spire at upper center" }, { "from": "gpt", "value": "(B) metallic spire at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b2d9de9191eca8b0.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.816, 0.219) (B) (0.531, 0.570) (C) (0.503, 0.452) (D) (0.081, 0.641)" }, { "from": "gpt", "value": "(C) (0.503, 0.452)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/005b9630718c06c7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black matte jacket at center is positioned above brown fuzzy jacket at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/babb1c96182fc740.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.273, 0.991) (B) (0.502, 0.702)" }, { "from": "gpt", "value": "(A) (0.273, 0.991)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d42d55e2b1abfef.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) green textured pine tree at center (B) brown leafy tree at left" }, { "from": "gpt", "value": "(B) brown leafy tree at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/057b9b1240b54362.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue matte jacket at center have a lesser width compared to blue reflective sunglasses at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, blue matte jacket at center might be wider than blue reflective sunglasses at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9a6aaae1b2b166c.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte gray shirt at center appear under green matte mustache at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a3c587ae8efcb7c8.jpg", "conversations": [ { "from": "human", "value": "\nDoes red/yellow fabric canopy at upper center appear over smooth glossy table at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, red/yellow fabric canopy at upper center is positioned over smooth glossy table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4418d82341566cc8.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.392, 0.977) (B) (0.297, 0.761)" }, { "from": "gpt", "value": "(B) (0.297, 0.761)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16dd88916947362b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue puffer vest at center is positioned below matte black shirt at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/137b3e56ed952e9c.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) white snow-covered mountain at center (B) white paper cup at lower left" }, { "from": "gpt", "value": "(B) white paper cup at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e37f20f8c0d5cea.jpg", "conversations": [ { "from": "human", "value": "\nWhere is black matte shirt at center located in relation to matte black shirt at lower center in the image? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b6328cd3b6c273da.jpg", "conversations": [ { "from": "human", "value": "\nDoes checkered wool jacket at center have a smaller size compared to black cotton shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, checkered wool jacket at center is not smaller in size than black cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/faa044d38a4c08fc.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) cloudy sky at upper center (B) smooth green mountains at center" }, { "from": "gpt", "value": "(A) cloudy sky at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab3c07d06030e0ef.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) blue fabric table at lower left (B) light blue striped shirt at center (C) white fabric table at lower left" }, { "from": "gpt", "value": "(B) light blue striped shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a395f92f523e1093.jpg", "conversations": [ { "from": "human", "value": "\nIs dark brown spiky hair at upper center closer to camera compared to rubberized red goggles at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49d660c59cb4bb7a.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.570, 0.914) (B) (0.322, 0.900)" }, { "from": "gpt", "value": "(B) (0.322, 0.900)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0022e09775235001.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.415, 0.434) (B) (0.006, 0.703) (C) (0.656, 0.161) (D) (0.340, 0.512)" }, { "from": "gpt", "value": "(B) (0.006, 0.703)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ac17cbb3cc3362d.jpg", "conversations": [ { "from": "human", "value": "\nIs silvery metallic fish at center wider than translucent white fish at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, silvery metallic fish at center is not wider than translucent white fish at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/11af667fc0942614.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) brown wooden cabin at center (B) mahogany wood rocking chair at center" }, { "from": "gpt", "value": "(A) brown wooden cabin at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8cd5ba67b3be2a10.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) silver metallic car at center (B) green leafy tree at center" }, { "from": "gpt", "value": "(A) silver metallic car at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c6444d3f56590b15.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) smooth red tablecloth at center (B) red fabric tablecloth at left (C) matte plastic posters at left" }, { "from": "gpt", "value": "(A) smooth red tablecloth at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/595a738d1a75ebe1.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white fabric couch at lower center is wider than white matte lamp at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3816953f8979fa69.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) metallic blue truck at right (B) translucent glass bottle at lower left" }, { "from": "gpt", "value": "(A) metallic blue truck at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/541818e5a5d699a5.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte shirt at center bigger than pink cotton shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, black matte shirt at center is bigger than pink cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c3ff4d6124fd95a0.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) wooden basketball court at center (B) striped fabric referee at left" }, { "from": "gpt", "value": "(A) wooden basketball court at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7671858cbb99d22f.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of light blue matte car at center and black plastic license plate at center in the image provided, where is light blue matte car at center located with respect to black plastic license plate at center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4a1a7b6c17735cf.jpg", "conversations": [ { "from": "human", "value": "\nDoes smooth black sweater at center appear over smooth skin hand at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fcf0f91f13f5addb.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth red radish at left below silver textured spoon at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/939d2ba19ba1bd5e.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) blue glossy monitor at lower center (B) matte red dress at center" }, { "from": "gpt", "value": "(B) matte red dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86448bfe23ed5ed8.jpg", "conversations": [ { "from": "human", "value": "\nIs white powdery snow at center to the left of gray fuzzy mule at left from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white powdery snow at center is not to the left of gray fuzzy mule at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a20c50538813ed4.jpg", "conversations": [ { "from": "human", "value": "\nDoes white glossy hot tub at center appear on the left side of white matte bikini top at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, white glossy hot tub at center is not on the left side of white matte bikini top at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e690b3dd0afcb23.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.634, 0.006) (B) (0.936, 0.872) (C) (0.719, 0.125) (D) (0.515, 0.506)" }, { "from": "gpt", "value": "(C) (0.719, 0.125)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fccaa090fcd10d57.jpg", "conversations": [ { "from": "human", "value": "\nDoes bare branches at right have a smaller size compared to silver metallic car at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, bare branches at right might be larger than silver metallic car at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8c955af2c5a7372.jpg", "conversations": [ { "from": "human", "value": "\nIs blue cotton shirt at center further to the viewer compared to matte black shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e1f4a4ed1c92f12.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.147, 0.627) (B) (0.655, 0.409) (C) (0.508, 0.567)" }, { "from": "gpt", "value": "(B) (0.655, 0.409)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ced38bd25223d74c.jpg", "conversations": [ { "from": "human", "value": "\nIs bronze statue at center thinner than white textured wing at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, bronze statue at center might be wider than white textured wing at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df88fc70fae928e5.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the smooth metal train track at center? Choose among these: (A) smooth steel tracks at center (B) black matte traffic light at upper center (C) metal/yellow/black sign at left (D) metallic pink train car at center" }, { "from": "gpt", "value": "(D) metallic pink train car at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ed9f14d297b86eb.jpg", "conversations": [ { "from": "human", "value": "\nDoes lavender fabric shirt at center have a smaller size compared to white shirt at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e7f2e5e93c3a9682.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.564, 0.836) (B) (0.398, 0.927) (C) (0.165, 0.531) (D) (0.921, 0.655)" }, { "from": "gpt", "value": "(A) (0.564, 0.836)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe92eb70e9390621.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of black plastic computer at bottom more distant than that of black plastic mouse at bottom right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, black plastic computer at bottom is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df4d504c321cf629.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy shrub at right above brown textured bush at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, green leafy shrub at right is located above brown textured bush at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e1d50bf2e79564a.jpg", "conversations": [ { "from": "human", "value": "\nDoes black matte skirt at center lie behind translucent white dress at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2fa5eab62cec46c5.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of green leafy shrub at right more distant than that of green leafy shrub at center-left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c45d87d49091b6d2.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.647, 0.509) (B) (0.599, 0.628)" }, { "from": "gpt", "value": "(A) (0.647, 0.509)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ee15a3e6b86e0b26.jpg", "conversations": [ { "from": "human", "value": "\nIs matte pink glasses at upper right above metallic gold glasses at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, matte pink glasses at upper right is not positioned above metallic gold glasses at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70ca24104750bbb3.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.908, 0.138) (B) (0.006, 0.467)" }, { "from": "gpt", "value": "(B) (0.006, 0.467)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/672e1863de86eaa0.jpg", "conversations": [ { "from": "human", "value": "\nIs white smooth suit at center smaller than yellow plastic flashlight at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white smooth suit at center is not smaller than yellow plastic flashlight at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be99583cf64a0a3a.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of gray cotton t-shirt at center less distant than that of striped cotton bed at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4fbc187d975c13c1.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark gray suit at left appear over gray hair suit at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, dark gray suit at left is not above gray hair suit at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5fc28470421b222b.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) blue water at lower center (B) white bark tree at left" }, { "from": "gpt", "value": "(A) blue water at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1bfd60430183378.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) white matte projection screen at center (B) camouflage uniform at center (C) camouflage fabric uniform at center" }, { "from": "gpt", "value": "(A) white matte projection screen at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bcaf6a1416c5de62.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.663, 0.344) (B) (0.756, 0.856) (C) (0.240, 0.523)" }, { "from": "gpt", "value": "(C) (0.240, 0.523)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3eb534495d5fdfd1.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.139, 0.619) (B) (0.149, 0.464) (C) (0.560, 0.261)" }, { "from": "gpt", "value": "(B) (0.149, 0.464)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/da08845573b59279.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) dark blue matte door at center (B) wooden birdhouse at left" }, { "from": "gpt", "value": "(B) wooden birdhouse at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c481856c320febdb.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) beige leather chair at left (B) beige fabric chair at right (C) beige fabric chair at center (D) beige leather chair at center, is positioned closest to the gray cotton shirt at center?" }, { "from": "gpt", "value": "(C) beige fabric chair at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9b3cf2598cd836f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) sandy textured hillside at upper center (B) blue fabric shirt at upper left (C) yellow hard hat at center (D) gray matte elephant at center" }, { "from": "gpt", "value": "(B) blue fabric shirt at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4c11881dd1003706.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if calico fur cat at center is positioned to the left of white fur cat at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, calico fur cat at center is not to the left of white fur cat at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aff669e02a389132.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.374, 0.469) (B) (0.668, 0.467) (C) (0.878, 0.508) (D) (0.056, 0.520)" }, { "from": "gpt", "value": "(D) (0.056, 0.520)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b533c3e0beabd416.jpg", "conversations": [ { "from": "human", "value": "\nWhere is brown concrete building at left located in relation to metallic blue car at center in the image? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/79029427b5428814.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the white uniformed pitcher at left? (A) wooden bat at center (B) white jersey baseball player at center" }, { "from": "gpt", "value": "(A) wooden bat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ddd72b41b4409518.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) brown matte eye at center (B) smooth skin face at center (C) brown matte eye at upper center, is positioned farthest from the brown matte eye at upper left?" }, { "from": "gpt", "value": "(B) smooth skin face at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03e2e4db6b49856f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) clear blue water at left (B) green leafy palm tree at right (C) white sandy beach at center" }, { "from": "gpt", "value": "(B) green leafy palm tree at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7fedb6474d3fe04e.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the green textured bush at center among (A) yellow-green leafy tree at center-left (B) green needle-like tree at upper right (C) brown rough bark tree at left (D) yellow-green foliage at center-right?" }, { "from": "gpt", "value": "(D) yellow-green foliage at center-right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eafe9aeed1b66d28.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) green glossy water at upper left (B) shiny golden leaves at upper right" }, { "from": "gpt", "value": "(A) green glossy water at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f0ce2433f04a1435.jpg", "conversations": [ { "from": "human", "value": "\nDoes white concrete pillar at lower right appear on the right side of concrete pillar at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white concrete pillar at lower right is not on the right side of concrete pillar at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a22ec28ebef5fc9d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if fluffy brown monkey at center is wider than orange fur tail at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba2ebd61f54e3f75.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) matte glass building at center (B) beige concrete building at center-left" }, { "from": "gpt", "value": "(A) matte glass building at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/071e580b4dcb0aec.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if metallic silver park bench at upper right is thinner than light blue fabric bench at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, metallic silver park bench at upper right might be wider than light blue fabric bench at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01b7d39d94918800.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) matte black cannon at left (B) matte black cannon at right (C) beige parchment sign at center" }, { "from": "gpt", "value": "(C) beige parchment sign at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bbecfbd281cdffc5.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of wooden pole at right in relation to gray asphalt pavement at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c2a3a551d9a25601.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.861, 0.873) (B) (0.616, 0.272)" }, { "from": "gpt", "value": "(B) (0.616, 0.272)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/33ed3bdad3fabe4d.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the matte white shirt at center? Choose from: (A) white matte car at upper center (B) green leafy tree at upper center" }, { "from": "gpt", "value": "(B) green leafy tree at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44e32aca8778ff74.jpg", "conversations": [ { "from": "human", "value": "\nDoes white soft fabric baby at center lie in front of matte gray sweater at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, white soft fabric baby at center is in front of matte gray sweater at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e711e30b44aa21b.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the black fabric camera at center? Select from: (A) matte gold jacket at upper center (B) white fabric table at lower left (C) white fabric table at center (D) light brown leather jacket at center" }, { "from": "gpt", "value": "(A) matte gold jacket at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c8e45308deb4359e.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the brown leather chair at left? Choose from: (A) wooden picture frame at upper left (B) gold-framed floral painting at upper right (C) brown leather armchair at center" }, { "from": "gpt", "value": "(B) gold-framed floral painting at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00014131957fa342.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the green needle-like tree at left among (A) white fabric flag at upper right (B) green evergreen tree at left (C) green textured tree at center?" }, { "from": "gpt", "value": "(A) white fabric flag at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ede961798cf6790.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if yellow metallic crane at center is bigger than metallic silver boat at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, yellow metallic crane at center is larger in size than metallic silver boat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d5163b9fc5fe3c7f.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the silver metallic tripod at center? Select from: (A) smooth concrete pavement at center (B) matte pink jacket at center" }, { "from": "gpt", "value": "(B) matte pink jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a286dbd686d8412e.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte van at lower right smaller than silver metallic sedan at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, white matte van at lower right is not smaller in size than silver metallic sedan at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/682f948cec9e413a.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) wooden polished chair at lower left (B) dark wood paneling at left" }, { "from": "gpt", "value": "(B) dark wood paneling at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8437e92430a66fe4.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) green matte bus at center (B) green matte bus at right" }, { "from": "gpt", "value": "(B) green matte bus at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/140b30499c8306c3.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the matte purple signpost at upper left? Choose from: (A) white plastic signpost at center (B) blue plastic street sign at upper left (C) shiny metallic bicycle at center (D) metallic silver pole at center" }, { "from": "gpt", "value": "(C) shiny metallic bicycle at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/90c782d7483ce564.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue striped shirt at center is positioned to the right of matte skin at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find blue striped shirt at center to the right of matte skin at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ced7ac2e925baf9e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) metallic silver bicycle at center (B) black matte bicycle at center (C) matte blue t-shirt at center (D) black matte shirt at center" }, { "from": "gpt", "value": "(A) metallic silver bicycle at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/66a184887bbe678a.jpg", "conversations": [ { "from": "human", "value": "\nIs striped cotton shirt at center wider than gray cotton shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, striped cotton shirt at center is wider than gray cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/84207845ce4c5c95.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is dark gray stone stairs at lower center located relative to wooden textured door at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/98fb56940a214b89.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the gray rough rock at center? (A) translucent blue water at center (B) red fabric person at center" }, { "from": "gpt", "value": "(A) translucent blue water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ee7a1494fe4f692b.jpg", "conversations": [ { "from": "human", "value": "\nDoes velvet santa at left appear over shiny green christmas tree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, velvet santa at left is below shiny green christmas tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e24f8146ca5a713a.jpg", "conversations": [ { "from": "human", "value": "\nIs green murky water at lower center closer to the viewer compared to green reflective water at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f08e1d17877bcb1.jpg", "conversations": [ { "from": "human", "value": "\nIs green needle-like at center to the right of green textured evergreen tree at upper center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find green needle-like at center to the right of green textured evergreen tree at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/81b6a19d44e5155a.jpg", "conversations": [ { "from": "human", "value": "\nIs matte skin at center wider than blue glossy eye at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of matte skin at center exceeds that of blue glossy eye at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16fceef3b6cfc065.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.171, 0.261) (B) (0.702, 0.945)" }, { "from": "gpt", "value": "(B) (0.702, 0.945)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58f992a1f7d1f48e.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark brown rubber oyster at lower left have a smaller size compared to dark matte jacket at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, dark brown rubber oyster at lower left has a smaller size compared to dark matte jacket at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3200c9d112b9cf07.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden bench at center bigger than green wrought iron chair at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, wooden bench at center is not larger than green wrought iron chair at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d01e4180b101432b.jpg", "conversations": [ { "from": "human", "value": "\nIs matte gold mailbox at left bigger than gold matte postbox at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, matte gold mailbox at left is larger in size than gold matte postbox at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a62ee8a94e8f6c44.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at left is wider than stone buildings at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, green leafy tree at left is not wider than stone buildings at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/acfc2b26b7ab8259.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black train at left bigger than glassy concrete building at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, matte black train at left is not larger than glassy concrete building at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/87431c245300ab41.jpg", "conversations": [ { "from": "human", "value": "\nDoes silver metallic rail at lower center appear on the left side of white metallic pole at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, silver metallic rail at lower center is to the left of white metallic pole at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc38b05bd42dc0ad.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white matte shirt at center is smaller than light brown leather hat at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, white matte shirt at center might be larger than light brown leather hat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1fdf7a5db875e063.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if smooth black suit at right is positioned to the left of matte black hand at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, smooth black suit at right is not on the left side of matte black hand at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b286bd2bfc59a978.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte t-shirt at center thinner than orange fleece shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, white matte t-shirt at center has a lesser width compared to orange fleece shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b664561d6b2f6524.jpg", "conversations": [ { "from": "human", "value": "\nIs green plaid shirt at center above dark blue jeans at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, green plaid shirt at center is below dark blue jeans at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/945a0b2f191bd3a6.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.126, 0.333) (B) (0.670, 0.580) (C) (0.923, 0.662)" }, { "from": "gpt", "value": "(A) (0.126, 0.333)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eca2dc8bfa950aa9.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if clear water at pond right is wider than pink blossoming tree at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0576ff7c0ba48202.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of green leafy tree at left in reference to green leafy tree at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a58a12ee757c2f9.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) blue ribbed sweater at upper left (B) dark blue sweater at center (C) dark brown dreadlocks at upper right" }, { "from": "gpt", "value": "(A) blue ribbed sweater at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed1529324ceaebf2.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is transparent glass window at upper left located relative to silver metallic gauge at right? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b515003511dbd9c6.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of striped fabric shirt at center in relation to denim shorts at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e350cbe2e2a4e8a1.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.509, 0.397) (B) (0.278, 0.572) (C) (0.652, 0.491)" }, { "from": "gpt", "value": "(B) (0.278, 0.572)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c63d34b797eb96bc.jpg", "conversations": [ { "from": "human", "value": "\nIs white plastic computer desk at center positioned in front of black matte mouse at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is in front of black matte mouse at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/302d155f254f1dcd.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green matte tree at center is smaller than clear glass lake at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, green matte tree at center occupies less space than clear glass lake at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4bff022276c55267.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow mosaic tile building at right behind light gray concrete skyscraper at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/68329560859b3dc6.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) matte plastic laptop at center (B) blue shirt at right (C) metallic silver laptop at center" }, { "from": "gpt", "value": "(B) blue shirt at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1da7c3d455500cf.jpg", "conversations": [ { "from": "human", "value": "\nIs white wood drawer at upper left to the left of white fabric drawer at left from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, white wood drawer at upper left is to the right of white fabric drawer at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/308ab12008365e19.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown spotted skin at center is positioned below brown spotted neck at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, brown spotted skin at center is not positioned below brown spotted neck at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e5f395e3ba00eb72.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is matte black jacket at center located relative to white dotted fabric tie at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1707e59c915a42a6.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy plant at center positioned behind green smooth stem at center-right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/af59503eabc9d4f6.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.808, 0.380) (B) (0.778, 0.983)" }, { "from": "gpt", "value": "(B) (0.778, 0.983)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8af55910a41384d6.jpg", "conversations": [ { "from": "human", "value": "\nDoes wooden cabinet at center appear under clear glass wine glass at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/27850a2b1f9afd23.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green glossy tree at center is positioned to the left of green matte tree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, green glossy tree at center is not to the left of green matte tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/42fced453355a433.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark brown leather jacket at lower left is bigger than red shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7c6b61f4aedde48.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) green mossy stone wall at lower right (B) blue water at lower right" }, { "from": "gpt", "value": "(B) blue water at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e3ef25209b769e09.jpg", "conversations": [ { "from": "human", "value": "\nWhere is smooth black paddle at center located in relation to black smooth paddle at center in the image? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c41e699aad8820de.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) matte black hair at upper center (B) matte green sweater at left (C) dark blue sweater at center (D) dark blue shirt at center" }, { "from": "gpt", "value": "(A) matte black hair at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c3d07a71ac7824f7.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) shiny red fire truck at center (B) yellow matte fire truck at center, is positioned farthest from the yellow reflective suit at center?" }, { "from": "gpt", "value": "(B) yellow matte fire truck at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a93626affdbc0dca.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the gray suit at center? (A) gray fabric jumpsuit at center (B) blue fabric canopy at upper center" }, { "from": "gpt", "value": "(B) blue fabric canopy at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8330d6a44c70b56a.jpg", "conversations": [ { "from": "human", "value": "\nIs matte purple backpack at center below yellow matte flower at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, matte purple backpack at center is located below yellow matte flower at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06d0b925d18de399.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) velvet black dress at left (B) velvet black dress at center (C) velvet-like dark blue dress at left (D) velvet maroon dress at right" }, { "from": "gpt", "value": "(D) velvet maroon dress at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c9a11bb438ada4d4.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the purple matte suit at center? (A) purple woven tie at center (B) dark blue suit at left (C) dark brown leather jacket at center (D) matte black suit at center" }, { "from": "gpt", "value": "(D) matte black suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2308745e85d34b82.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) green wooden train track at center (B) green reflective water at center" }, { "from": "gpt", "value": "(B) green reflective water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a411f30ed338b7fa.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white plastic table at center is positioned below matte orange shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49d8f58e4b94132f.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of silver/black plastic printer at center in reference to matte silver laptop at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c09594b5a54b3bef.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if natural wood beach chair at center is bigger than matte brown fabric chair at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, natural wood beach chair at center is larger in size than matte brown fabric chair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7c73120d14e88d72.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of brown pinstripe shirt at center and orange shirt at right in the image provided, where is brown pinstripe shirt at center located with respect to orange shirt at right? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a719839b2fbc5fbf.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte patch at center above red leather jacket at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, black matte patch at center is positioned over red leather jacket at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b2cb24cbaef04752.jpg", "conversations": [ { "from": "human", "value": "\nIs green grassy mound at lower left closer to the viewer compared to brown rough bark tree trunk at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/52a41d9b0f807593.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of camouflage fabric uniform at left in relation to black matte video camera at center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/620f24c3eec38540.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.043, 0.581) (B) (0.565, 0.570) (C) (0.811, 0.805) (D) (0.190, 0.558)" }, { "from": "gpt", "value": "(C) (0.811, 0.805)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/94f8b172aa54a362.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the black matte camera at center? (A) white matte guitar at center (B) plaid shirt vest at center (C) white cotton t-shirt at lower center (D) white matte cap at center" }, { "from": "gpt", "value": "(A) white matte guitar at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d2d9647e467787bd.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) matte plastic bowl at left (B) yellow matte rice at upper left (C) white matte shirt at center" }, { "from": "gpt", "value": "(B) yellow matte rice at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c9c067a6cb02103b.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) formal suit at upper right (B) green matte jacket at center" }, { "from": "gpt", "value": "(B) green matte jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b82a0ae2af024256.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.741, 0.797) (B) (0.587, 0.498) (C) (0.463, 0.988)" }, { "from": "gpt", "value": "(C) (0.463, 0.988)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/93b9302dc0086891.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if beige stone church at center is positioned to the left of pink fabric at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, beige stone church at center is to the left of pink fabric at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/abe1ad2df52a105c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green grass at lower center is positioned above green glass window at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/107c3da55deed345.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown feathered duck at left appear on the left side of brown feathered duck at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, brown feathered duck at left is positioned on the left side of brown feathered duck at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/936514d16ab3a4b1.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy plant at center is smaller than transparent glass window at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, green leafy plant at center might be larger than transparent glass window at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c1ee0a2b8c1567f.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown cardboard sign at center is positioned to the right of black matte shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find brown cardboard sign at center to the right of black matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed3e8e544f8bd417.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) green grass at center (B) matte blue shirt at left" }, { "from": "gpt", "value": "(B) matte blue shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a70637129bb196f7.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the shiny silk vest at center? Choose among these: (A) shiny red fabric at center (B) matte black hat at center" }, { "from": "gpt", "value": "(A) shiny red fabric at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7cc9325642e1ef1.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte projection screen at upper center appear under matte black laptop at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/131dc3c0e84146aa.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) transparent glass water at center (B) blue fabric jacket at upper center" }, { "from": "gpt", "value": "(B) blue fabric jacket at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/098007e850cb754d.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte red and yellow train at center appear under matte metallic train at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, matte red and yellow train at center is located below matte metallic train at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2963060ea3cb33dd.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of green dotted dress at left and silver metallic hula hoop at center in the image provided, where is green dotted dress at left located with respect to silver metallic hula hoop at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16765c4d112b616b.jpg", "conversations": [ { "from": "human", "value": "\nIs blue patterned robe at center closer to camera compared to black plastic paintball gun at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0056eb61417b2261.jpg", "conversations": [ { "from": "human", "value": "\nDoes metallic chain-link fence at center appear under satin silver sedan at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, metallic chain-link fence at center is not below satin silver sedan at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0eb20efcc6d11e51.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the white matte plate at center among (A) translucent glass bottle at table right (B) wooden table at center?" }, { "from": "gpt", "value": "(B) wooden table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/849807d4eb952afa.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) asphalt road at center (B) white fluffy cloud at upper center" }, { "from": "gpt", "value": "(A) asphalt road at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a32aa90f9f603b3a.jpg", "conversations": [ { "from": "human", "value": "\nIs green felt pool table at center closer to the viewer compared to matte red shirt at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ad9598b583cc7915.jpg", "conversations": [ { "from": "human", "value": "\nDoes sandy beach at center have a lesser width compared to matte red shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, sandy beach at center is not thinner than matte red shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f05c7f96ecae517d.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) gray textured eagle at center (B) sculpted stone figure at upper left" }, { "from": "gpt", "value": "(A) gray textured eagle at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c071e38062384fb.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.619, 0.339) (B) (0.080, 0.314)" }, { "from": "gpt", "value": "(A) (0.619, 0.339)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6138bdc1163b6236.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the green leafy palm tree at left? Select from: (A) blue jeans at center (B) brown textured stone palace at center (C) clear glass water at center" }, { "from": "gpt", "value": "(B) brown textured stone palace at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b98fd140e721f43.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.402, 0.908) (B) (0.740, 0.564) (C) (0.560, 0.113)" }, { "from": "gpt", "value": "(B) (0.740, 0.564)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca397b25bd62fee5.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) white plastic hut at right (B) yellow wood cabin at center" }, { "from": "gpt", "value": "(B) yellow wood cabin at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/40d9f529c11fadb2.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.073, 0.823) (B) (0.695, 0.856)" }, { "from": "gpt", "value": "(A) (0.073, 0.823)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/74806699e360c0fa.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of smooth gray rock at center in reference to pink fabric dress at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16817d124f9f6c03.jpg", "conversations": [ { "from": "human", "value": "\nIs gold metallic lampshade at upper center below matte black jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, gold metallic lampshade at upper center is not below matte black jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5222509a84c4d36c.jpg", "conversations": [ { "from": "human", "value": "\nIs velvet red couch at lower center smaller than white dotted dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, velvet red couch at lower center might be larger than white dotted dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0c8c59a34b9f2028.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.504, 0.470) (B) (0.333, 0.659) (C) (0.583, 0.658)" }, { "from": "gpt", "value": "(A) (0.504, 0.470)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dcd62913899e3f7e.jpg", "conversations": [ { "from": "human", "value": "\nDoes black synthetic jacket at center have a greater width compared to matte black jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, black synthetic jacket at center is wider than matte black jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/404194dd33c69fb2.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) matte wood window frame at upper right (B) matte brown siding at left" }, { "from": "gpt", "value": "(A) matte wood window frame at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/24666e22ebfca6f5.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) matte black coat at center (B) wooden at left (C) red fabric jacket at center" }, { "from": "gpt", "value": "(C) red fabric jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/284d234e9bd19830.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte blue shirt at left lie behind black plastic microphone at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca20c8cbb813f0a6.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of matte green shirt at center in reference to vanilla ice cream at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77df3cca4a09d4ae.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the dark hair at lower center from the following options: (A) american flag at center (B) white plastic scoreboard at upper right?" }, { "from": "gpt", "value": "(A) american flag at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88edcf1c62e3e0d4.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray sweater at right appear over red fabric flag at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, gray sweater at right is not positioned above red fabric flag at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ad2373297d9c7b1.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.315, 0.589) (B) (0.593, 0.272)" }, { "from": "gpt", "value": "(A) (0.315, 0.589)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9efac42465055358.jpg", "conversations": [ { "from": "human", "value": "\nDoes soft beige robe at left appear under red fabric hanger at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/845645bd4a02b7fb.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the green matte monitor at center? Choose among these: (A) beige plastic smaky 100 at center (B) brown plastic keyboard at center (C) black plastic smaky 100 at center (D) green leafy plant at left" }, { "from": "gpt", "value": "(D) green leafy plant at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7085589dfe513754.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) blue fabric flag at upper left (B) orange fabric flag at left (C) beige stone clock tower at center (D) white textured clock at upper center" }, { "from": "gpt", "value": "(D) white textured clock at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b365d1bb487f288.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the white fluffy cloud at upper center among (A) white fluffy cloud at upper right (B) green leafy tree at right?" }, { "from": "gpt", "value": "(B) green leafy tree at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73a48b797e2fab40.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the white plastic sign at lower right? Choose among these: (A) shiny black sedan at lower left (B) white glossy taxi at center" }, { "from": "gpt", "value": "(A) shiny black sedan at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29605452fdaeb07e.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.734, 0.191) (B) (0.914, 0.314)" }, { "from": "gpt", "value": "(B) (0.914, 0.314)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bdbba126c142b152.jpg", "conversations": [ { "from": "human", "value": "\nDoes polished black locomotive at center have a larger size compared to white vapor at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, polished black locomotive at center is not bigger than white vapor at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d2efd1d3fe568c32.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the floral dress at lower center from the following options: (A) white cotton shirt at center (B) pale pink fabric at center (C) matte white blouse at center (D) smooth brown sausages at upper right?" }, { "from": "gpt", "value": "(D) smooth brown sausages at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df7342e0da990e3f.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.322, 0.542) (B) (0.400, 0.487) (C) (0.462, 0.809) (D) (0.917, 0.848)" }, { "from": "gpt", "value": "(D) (0.917, 0.848)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d764ddd59eac469.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) matte yellow shorts at left (B) black matte shorts at center (C) green matte shorts at right (D) matte black shorts at center" }, { "from": "gpt", "value": "(B) black matte shorts at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c90f506f7d228aa.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black leather jacket at left is positioned to the right of white plastic chair at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, black leather jacket at left is not on the right side of white plastic chair at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ee279bee929d3d4.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte brown cardboard box at center appear on the left side of brown paper bag at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, matte brown cardboard box at center is not to the left of brown paper bag at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6a973166922884cb.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark brown dress at center lie in front of dark brown fabric children at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, dark brown dress at center is in front of dark brown fabric children at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd6d30412d48876e.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow matte surfboard at upper left above matte red surfboard at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c907aafa7d7631f9.jpg", "conversations": [ { "from": "human", "value": "\nIs black leather jacket at center smaller than black plastic sunglasses at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, black leather jacket at center is not smaller in size than black plastic sunglasses at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c979904f57b23f25.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.320, 0.825) (B) (0.309, 0.811)" }, { "from": "gpt", "value": "(A) (0.320, 0.825)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9adef9b2e86c6c92.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown earthy dirt field at center is positioned below green leafy tree at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, brown earthy dirt field at center is below green leafy tree at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e73c83ad7415c83f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.042, 0.256) (B) (0.150, 0.447) (C) (0.583, 0.577) (D) (0.900, 0.494)" }, { "from": "gpt", "value": "(B) (0.150, 0.447)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/970533d0ece6b083.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of denim shorts at center more distant than that of brown fur coat at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/892816f824e15ef9.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.794, 0.533) (B) (0.985, 0.189)" }, { "from": "gpt", "value": "(B) (0.985, 0.189)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e720a36a6e6edefd.jpg", "conversations": [ { "from": "human", "value": "\nIs pink fleece blanket at lower center in front of white matte tank top at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is in front of white matte tank top at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/80bb92a1b36e82a6.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) matte brown cardigan at center (B) dark gray shirt at center" }, { "from": "gpt", "value": "(A) matte brown cardigan at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/11bc48202045c331.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black suit at center closer to camera compared to matte black hand at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/32495b9cf3ea9117.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the stainless steel refrigerator at center? Choose from: (A) stainless steel oven at left (B) white wood drawer at lower left (C) matte white drawer at lower center" }, { "from": "gpt", "value": "(A) stainless steel oven at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b71836c946b8c2c1.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy palm tree at upper right is positioned below matte red suv at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, green leafy palm tree at upper right is not below matte red suv at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc59f755c09fb451.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the white fabric shorts at left? Choose from: (A) white cotton shirt at lower left (B) white matte shirt at lower left" }, { "from": "gpt", "value": "(A) white cotton shirt at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e809f65d66cdf20.jpg", "conversations": [ { "from": "human", "value": "\nIs gray cotton t-shirt at center wider than brown wooden barrel at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, gray cotton t-shirt at center is not wider than brown wooden barrel at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8fe3e38469fe338a.jpg", "conversations": [ { "from": "human", "value": "\nDoes light gray fabric shirt at lower right have a greater width compared to blue fabric shirt at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, light gray fabric shirt at lower right is wider than blue fabric shirt at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05a1e9ce01872f95.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte board game at upper right have a larger size compared to matte blue sweater at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, matte board game at upper right has a larger size compared to matte blue sweater at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d607e176308e5b0e.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) maroon velvet gown at lower left (B) black matte graduation gown at center, is positioned closest to the purple matte graduation gown at left?" }, { "from": "gpt", "value": "(A) maroon velvet gown at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/020835e4cdc4180a.jpg", "conversations": [ { "from": "human", "value": "\nIs black leather bar stool at center closer to the viewer compared to black leather bar stool at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, black leather bar stool at center is in front of black leather bar stool at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5fa551ddf709d597.jpg", "conversations": [ { "from": "human", "value": "\nDoes shiny blue peacock at center appear on the right side of green plastic plate at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, shiny blue peacock at center is to the left of green plastic plate at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/71414afc6b086fee.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if yellow striped shirt at left is positioned above purple matte shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, yellow striped shirt at left is located above purple matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/28063a684c6651f1.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black suit at left come in front of light brown wooden armchair at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/67c89d38febc511d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.361, 0.705) (B) (0.449, 0.759)" }, { "from": "gpt", "value": "(A) (0.361, 0.705)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cdf3f061aa6c625c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) gray fur kangaroo at lower center (B) gray fur rabbit at center" }, { "from": "gpt", "value": "(A) gray fur kangaroo at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02d3f32291f4c295.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if glossy blue car at center is positioned below metallic silver car at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, glossy blue car at center is positioned under metallic silver car at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/485cdf9c51887c68.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green grassy hillside at center is bigger than green grass pasture at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b73c0e9b27bdcb7f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.046, 0.762) (B) (0.087, 0.914) (C) (0.952, 0.495) (D) (0.542, 0.925)" }, { "from": "gpt", "value": "(C) (0.952, 0.495)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b700ad771f29ceb.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.068, 0.445) (B) (0.586, 0.670) (C) (0.496, 0.320) (D) (0.444, 0.636)" }, { "from": "gpt", "value": "(A) (0.068, 0.445)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9cb6fc0ebe11ecd0.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.865, 0.692) (B) (0.608, 0.978)" }, { "from": "gpt", "value": "(B) (0.608, 0.978)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8557c4b43694573e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.354, 0.528) (B) (0.651, 0.641)" }, { "from": "gpt", "value": "(B) (0.651, 0.641)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/75597d114c5b11a4.jpg", "conversations": [ { "from": "human", "value": "\nIs concrete rebar at center behind metallic red tower crane at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a6c0c928a24c40d5.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) light brown uniform skirt at lower right (B) light brown fabric jacket at center (C) dark blue jeans at center" }, { "from": "gpt", "value": "(C) dark blue jeans at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab18ae140c5e8b7c.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the black matte microphone at left from the following options: (A) black matte microphone at center (B) matte black microphone at center?" }, { "from": "gpt", "value": "(A) black matte microphone at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5f0bfdbf74ad9342.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.332, 0.642) (B) (0.474, 0.861) (C) (0.722, 0.816) (D) (0.261, 0.988)" }, { "from": "gpt", "value": "(A) (0.332, 0.642)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01678757d11a7509.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.521, 0.600) (B) (0.981, 0.347) (C) (0.741, 0.536)" }, { "from": "gpt", "value": "(A) (0.521, 0.600)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f274dc15bb2a4198.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.357, 0.891) (B) (0.300, 0.759)" }, { "from": "gpt", "value": "(A) (0.357, 0.891)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85d6b19fd36c6db6.jpg", "conversations": [ { "from": "human", "value": "\nDoes smooth metal rail at center appear on the left side of metallic pole at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, smooth metal rail at center is positioned on the left side of metallic pole at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4429673ef9974c26.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the matte black phone at center? (A) satin silver phone at center (B) transparent glass table at center" }, { "from": "gpt", "value": "(A) satin silver phone at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1a6e6fe12ed9e49.jpg", "conversations": [ { "from": "human", "value": "\nIs gray woolen goat at upper center below blue rubber tire at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, gray woolen goat at upper center is not positioned below blue rubber tire at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00ad1c554e11b6e5.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.237, 0.928) (B) (0.009, 0.341)" }, { "from": "gpt", "value": "(B) (0.009, 0.341)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d25e2cb7093d2e8.jpg", "conversations": [ { "from": "human", "value": "\nIs green carved wood figure at center positioned in front of matte black lamp post at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, green carved wood figure at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7cb9990776c65694.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.756, 0.802) (B) (0.538, 0.434)" }, { "from": "gpt", "value": "(A) (0.756, 0.802)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab555ac4ad52fc96.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the black matte picture frame at upper center among (A) dark matte picture frame at upper left (B) black matte picture frame at upper left?" }, { "from": "gpt", "value": "(B) black matte picture frame at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a2fc45f2fb9146e.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte baseball glove at center have a greater width compared to brown leather glove at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c0f004cf588ca08b.jpg", "conversations": [ { "from": "human", "value": "\nDoes white feathered parrot at center have a lesser width compared to smooth skin palm at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, white feathered parrot at center is not thinner than smooth skin palm at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb62c4346c93a59e.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the wooden table at center? (A) transparent glass table at lower right (B) matte plastic vase at center (C) green matte plant at center" }, { "from": "gpt", "value": "(A) transparent glass table at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6883508e4b349f32.jpg", "conversations": [ { "from": "human", "value": "\nIs gray down jacket at center bigger than yellow metallic tricycle at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, gray down jacket at center is not larger than yellow metallic tricycle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/61e6cce99142e98c.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark brown metal stairs at center appear under rusty metal pipe at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, dark brown metal stairs at center is located below rusty metal pipe at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/575a5229d276992e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.702, 0.722) (B) (0.194, 0.839)" }, { "from": "gpt", "value": "(A) (0.702, 0.722)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/33751d246f1f3f62.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.107, 0.491) (B) (0.042, 0.597)" }, { "from": "gpt", "value": "(B) (0.042, 0.597)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/55cf0f0a6c5836ce.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray matte shirt at center have a greater width compared to matte gray shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, gray matte shirt at center is wider than matte gray shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4dc78249850613f0.jpg", "conversations": [ { "from": "human", "value": "\nDoes white paper sign at center have a lesser width compared to green plastic sign at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white paper sign at center is not thinner than green plastic sign at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/14ec08c6986b2dca.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the smooth skin face at center among (A) transparent glass spider web at center (B) metallic silver car at center (C) satin black car at center?" }, { "from": "gpt", "value": "(A) transparent glass spider web at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04f1ff34b853b7d5.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.456, 0.914) (B) (0.805, 0.884) (C) (0.217, 0.812) (D) (0.937, 0.891)" }, { "from": "gpt", "value": "(D) (0.937, 0.891)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fa19bd8b520c439c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown wood cabin at left is positioned to the left of matte wood hut at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find brown wood cabin at left to the left of matte wood hut at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c03740e7b7176c6d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if rough wooden table at center is smaller than matte brown finger at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff8fd294191d8cc3.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) beige stone wall at lower center (B) light beige stone bell tower at center (C) orange metallic crane at left, is positioned closest to the white stone dome at center?" }, { "from": "gpt", "value": "(B) light beige stone bell tower at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/885a1ee79a8bcf47.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.605, 0.703) (B) (0.454, 0.791)" }, { "from": "gpt", "value": "(A) (0.605, 0.703)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a710ca8d05755b7.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass at lower center positioned behind floral silk dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/977e6eb0c8448a80.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black sweater at center have a smaller size compared to striped fabric chair at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, matte black sweater at center occupies less space than striped fabric chair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf18df8508778298.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green glossy monster truck at center is bigger than white shirt at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, green glossy monster truck at center is bigger than white shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e13a84f3673ecbcb.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth concrete curb at right bigger than matte black suit at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, smooth concrete curb at right is not bigger than matte black suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f721487933e9f712.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.512, 0.681) (B) (0.679, 0.556) (C) (0.221, 0.784)" }, { "from": "gpt", "value": "(B) (0.679, 0.556)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a0b640221aeca837.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the white lace umbrella at center? Select from: (A) shiny gold robe at center (B) gold textured robe at center (C) smooth black robe at center" }, { "from": "gpt", "value": "(C) smooth black robe at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/96412275fa8f5658.jpg", "conversations": [ { "from": "human", "value": "\nIs white fabric pants at center wider than white cotton cricket bat at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8d0d639c8f19d49.jpg", "conversations": [ { "from": "human", "value": "\nIs maroon fabric shirt at center wider than black matte running shoes at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, maroon fabric shirt at center is wider than black matte running shoes at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db638f3c5fe00b9d.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) blue plastic sign at lower right (B) white matte signboard at lower center (C) black and white cityscape at center" }, { "from": "gpt", "value": "(B) white matte signboard at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e54717b5c80a9364.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at center to the right of green leafy tree at left from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, green leafy tree at center is positioned on the right side of green leafy tree at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf3ee1b09639d54e.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.785, 0.427) (B) (0.005, 0.478) (C) (0.282, 0.591) (D) (0.540, 0.280)" }, { "from": "gpt", "value": "(B) (0.005, 0.478)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c6e984e3c2dca3c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.536, 0.986) (B) (0.781, 0.802)" }, { "from": "gpt", "value": "(B) (0.781, 0.802)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/53af0b6026bf635d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.297, 0.500) (B) (0.572, 0.517)" }, { "from": "gpt", "value": "(B) (0.572, 0.517)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6cedb212cfc352ab.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black matte table at center is positioned above black leather camera at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, black matte table at center is located above black leather camera at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c70b03f970f5f3a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) matte blue tie at center (B) black matte leggings at center" }, { "from": "gpt", "value": "(A) matte blue tie at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b46538c777dc5374.jpg", "conversations": [ { "from": "human", "value": "\nIs rocky at right positioned in front of clear blue water at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is in front of clear blue water at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/55254c9e71119c06.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.291, 0.820) (B) (0.619, 0.642)" }, { "from": "gpt", "value": "(A) (0.291, 0.820)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/984b427ac0e09e53.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) light gray sweater at center (B) black matte laptop at center" }, { "from": "gpt", "value": "(A) light gray sweater at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0697a6e544cffb2d.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) golden textured leaves at center (B) yellow leafy tree at upper center" }, { "from": "gpt", "value": "(A) golden textured leaves at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/731e226990cdc1f8.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.545, 0.348) (B) (0.872, 0.711) (C) (0.209, 0.722) (D) (0.456, 0.394)" }, { "from": "gpt", "value": "(B) (0.872, 0.711)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7f8755b7df60b229.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) blue plastic fan at center (B) white plastic computer desk at center" }, { "from": "gpt", "value": "(A) blue plastic fan at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88c3319a788437e8.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) wooden desk at center (B) beige plastic printer at center" }, { "from": "gpt", "value": "(A) wooden desk at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/47619112dcd5e9b6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte blue shirt at lower left is wider than light blue denim shorts at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, matte blue shirt at lower left might be narrower than light blue denim shorts at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c42229e6339f4953.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy branch at upper left closer to camera compared to green leafy tree at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, green leafy branch at upper left is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b2d1ce2cf7055840.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the dripping blood text at center? Select from: (A) smokematerial/texture at upper right (B) white text at center" }, { "from": "gpt", "value": "(B) white text at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6d200e329b63ceb.jpg", "conversations": [ { "from": "human", "value": "\nIs brown stone building at center above blue fabric shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, brown stone building at center is positioned over blue fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c427ee54657af277.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) marbled fabric shirt at center (B) floral fabric shirt at center" }, { "from": "gpt", "value": "(B) floral fabric shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7d2744399677717c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) green canvas tote at center (B) yellow fabric tote at right" }, { "from": "gpt", "value": "(B) yellow fabric tote at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/09723a5b57ee69db.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) pink satin dress at lower left (B) clear crystal tiara at center (C) yellow cotton shirt at upper right" }, { "from": "gpt", "value": "(C) yellow cotton shirt at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ffabe139574ec951.jpg", "conversations": [ { "from": "human", "value": "\nIs green grassy at center closer to camera compared to green grassy hillside at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dac238edf2da5374.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.531, 0.536) (B) (0.627, 0.486) (C) (0.472, 0.794)" }, { "from": "gpt", "value": "(B) (0.627, 0.486)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f975a41e03782c8.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the wooden bookshelf at upper center from the following options: (A) white matte cup at center (B) dark brown hair at upper right?" }, { "from": "gpt", "value": "(B) dark brown hair at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ee9aad80d7440e0e.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) golden feathered duckling at center (B) shiny golden duck at lower right (C) golden feathered duck at right" }, { "from": "gpt", "value": "(C) golden feathered duck at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4a390fa2c262f03.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black text at upper left is bigger than matte black text at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte black text at upper left is bigger than matte black text at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6aabef2c4a28ec80.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) white marble mermaid at center (B) white marble statue at center" }, { "from": "gpt", "value": "(A) white marble mermaid at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/175411da40c71b3b.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of matte black clothing at center and sunglasses at center in the image provided, where is matte black clothing at center located with respect to sunglasses at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04b39297c4bd36fe.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.559, 0.652) (B) (0.288, 0.827)" }, { "from": "gpt", "value": "(B) (0.288, 0.827)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ca1c01b08bb93ed.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow fabric canopy at center further to camera compared to white plastic table at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, yellow fabric canopy at center is further from the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3615ce1d2061d160.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if smooth beige skirt at center is smaller than green velvet dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f68aa7c1aed263f2.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue textured fabric at right is thinner than shiny dark brown hair at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, blue textured fabric at right's width is not less than shiny dark brown hair at upper left's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ac81687f14d2aa6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green mossy ground at center is wider than purple matte flower at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, green mossy ground at center is wider than purple matte flower at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1aaa7b13321a3b76.jpg", "conversations": [ { "from": "human", "value": "\nDoes glassy steel building at center appear on the left side of white glass building at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, glassy steel building at center is positioned on the left side of white glass building at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b81574f8636737e.jpg", "conversations": [ { "from": "human", "value": "\nIs matte orange jersey at center in front of matte black backpack at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte orange jersey at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb3deff16b2ffce7.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the white glossy table at lower center? Choose from: (A) matte orange shirt at center (B) matte orange dress at center" }, { "from": "gpt", "value": "(B) matte orange dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cfdebd848c94ba77.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.527, 0.808) (B) (0.103, 0.125) (C) (0.831, 0.416) (D) (0.517, 0.388)" }, { "from": "gpt", "value": "(A) (0.527, 0.808)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8600c9a6103d7905.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.975, 0.766) (B) (0.199, 0.984)" }, { "from": "gpt", "value": "(B) (0.199, 0.984)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/51ef0f9dc0462c69.jpg", "conversations": [ { "from": "human", "value": "\nIs pink glass lampshade at lower right to the right of pink glass table lamp at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find pink glass lampshade at lower right to the right of pink glass table lamp at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78be6793aad3899f.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) blue fabric dress at lower left (B) brown leather harness at left (C) beige fabric robe at center" }, { "from": "gpt", "value": "(B) brown leather harness at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c2af6eef3f984366.jpg", "conversations": [ { "from": "human", "value": "\nIs foggy translucent morning fog at left bigger than green frosted grass at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, foggy translucent morning fog at left is larger in size than green frosted grass at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e72c6a89e554a216.jpg", "conversations": [ { "from": "human", "value": "\nDoes camouflage fabric uniform at right appear on the left side of camouflage fabric uniform at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, camouflage fabric uniform at right is to the right of camouflage fabric uniform at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/942e6a62c392aa0a.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) clear water at stream center (B) green mossy branch at upper center" }, { "from": "gpt", "value": "(B) green mossy branch at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92265d3f62cdc548.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.326, 0.531) (B) (0.851, 0.322)" }, { "from": "gpt", "value": "(B) (0.851, 0.322)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/71985e260c63cded.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if pink matte shirt at center is positioned to the right of metallic red bridge at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, pink matte shirt at center is positioned on the right side of metallic red bridge at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01fc4f9ac85a0193.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at center is smaller than rustic brown deer at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green leafy tree at center has a smaller size compared to rustic brown deer at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab4b5ad4406906b2.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black matte shirt at lower right is positioned to the left of stone bridge at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, black matte shirt at lower right is not on the left side of stone bridge at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4a178e53b2956ff.jpg", "conversations": [ { "from": "human", "value": "\nDoes green mossy tree at upper center appear on the right side of gray stone gazebo at center-right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, green mossy tree at upper center is to the left of gray stone gazebo at center-right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7bce5fef0732929.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) blue cotton hoodie at center (B) blue fleece sweatshirt at center (C) paved stone sidewalk at left" }, { "from": "gpt", "value": "(C) paved stone sidewalk at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/79026318ed54ce1d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if metallic silver suv at center is smaller than silver metallic car at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, metallic silver suv at center is not smaller than silver metallic car at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9a437daac10f85c.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the metallic gray bridge at center among (A) white glossy sailboat at center (B) white sailboat at center?" }, { "from": "gpt", "value": "(A) white glossy sailboat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f236d1e728b8c92c.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of brown textured dirt at center and gray fabric shirt at center in the image provided, where is brown textured dirt at center located with respect to gray fabric shirt at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/920141be4cb7e275.jpg", "conversations": [ { "from": "human", "value": "\nIs white textured balcony at center wider than metallic wire at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, white textured balcony at center is not wider than metallic wire at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f6dfca6114b8a36.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) denim jeans at center (B) dark blue shirt at upper center (C) matte red backpack at center (D) dark brown leather jacket at center" }, { "from": "gpt", "value": "(A) denim jeans at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3059b3cc8f9f5bf0.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black suit at left below black textured blazer at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, matte black suit at left is not positioned below black textured blazer at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab7257aafdbc8700.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) shiny red motorcycle at lower left (B) smooth asphalt parking lot at lower center" }, { "from": "gpt", "value": "(A) shiny red motorcycle at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/647a7f5c9c4e3ed3.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the green matte tree at right from the following options: (A) blue fabric person at lower center (B) brown textured trees at upper center?" }, { "from": "gpt", "value": "(B) brown textured trees at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a5d160851757d68.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray fleece sweater at center appear over blue plaid shirt at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, gray fleece sweater at center is positioned over blue plaid shirt at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ec4952e80cc5295.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of striped cotton polo shirt at left in relation to black matte bikini top at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d5a0f07ab7f1936.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of yellow matte clock tower at center in relation to metallic silver clock at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a14394322cf7043d.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) red checkered tablecloth at center (B) black satin jacket at left" }, { "from": "gpt", "value": "(B) black satin jacket at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4767d2501dd8184.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the dark brown hair at center among (A) green velvet robe at center (B) green velvet gown at center?" }, { "from": "gpt", "value": "(B) green velvet gown at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea9178c2f0426632.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.624, 0.075) (B) (0.043, 0.523)" }, { "from": "gpt", "value": "(B) (0.043, 0.523)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04edd0d0972fdae4.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the spotted fur giraffe at center among (A) dry grass at center (B) brown textured tree at right?" }, { "from": "gpt", "value": "(B) brown textured tree at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c58e07fd5f9002f.jpg", "conversations": [ { "from": "human", "value": "\nDoes white frosty tree at center appear over white fluffy snow at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, white frosty tree at center is above white fluffy snow at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bfb2bf046267b443.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) denim shirt at upper right (B) denim jacket at center (C) matte blue shirt at center" }, { "from": "gpt", "value": "(B) denim jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d912b60fbeb2627.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) shiny black uniform at center (B) dark blue uniform at center" }, { "from": "gpt", "value": "(A) shiny black uniform at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/42756f53f8c141c5.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) hardcover book at upper center (B) hardcover book at center (C) matte black photograph at left" }, { "from": "gpt", "value": "(C) matte black photograph at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1929e6b4149fc082.jpg", "conversations": [ { "from": "human", "value": "\nIs gray tattooed scorpion at center bigger than black tattooed scorpion at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, gray tattooed scorpion at center is not bigger than black tattooed scorpion at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c7b72a301eab5f8.jpg", "conversations": [ { "from": "human", "value": "\nDoes teal dotted shirt at center lie behind matte red tank top at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7527b3f7250c9e2.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.725, 0.422) (B) (0.076, 0.520) (C) (0.011, 0.463) (D) (0.663, 0.561)" }, { "from": "gpt", "value": "(C) (0.011, 0.463)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03ea1494da3a019f.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.769, 0.152) (B) (0.552, 0.147) (C) (0.420, 0.336)" }, { "from": "gpt", "value": "(A) (0.769, 0.152)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16572fc3425ed8e4.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.731, 0.566) (B) (0.420, 0.461) (C) (0.186, 0.473) (D) (0.945, 0.925)" }, { "from": "gpt", "value": "(C) (0.186, 0.473)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9ce0d016ee7ecd3.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.380, 0.695) (B) (0.398, 0.470) (C) (0.535, 0.770) (D) (0.825, 0.419)" }, { "from": "gpt", "value": "(D) (0.825, 0.419)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e3997235bbb1e4ef.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the pink fleece jacket at center? (A) pink fleece jacket at left (B) red fleece sweatshirt at center" }, { "from": "gpt", "value": "(A) pink fleece jacket at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c0e6b4b7c7b3245d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.552, 0.011) (B) (0.344, 0.136) (C) (0.483, 0.881)" }, { "from": "gpt", "value": "(C) (0.483, 0.881)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c5ddce26d7d20d1d.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of green forested mountain at center and brown smoke at center in the image provided, where is green forested mountain at center located with respect to brown smoke at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/673c20e6d77ab076.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the green fabric bus stop at lower center? Choose from: (A) brown leather jacket at lower left (B) satin silver suv at lower right (C) white matte jacket at lower center" }, { "from": "gpt", "value": "(A) brown leather jacket at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/27c3af7714355867.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of light brown wood table at center in reference to white paper at lower center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/715e1d58d95673e3.jpg", "conversations": [ { "from": "human", "value": "\nIs light blue cotton shirt at center smaller than matte black shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, light blue cotton shirt at center has a smaller size compared to matte black shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1bf74e1cb0ce5f8b.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) reflective glass water at center (B) multicolored foliage at center" }, { "from": "gpt", "value": "(A) reflective glass water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d63fb8876d1745e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) teal glossy water at center (B) white metallic rail at lower left (C) smooth concrete dock at center" }, { "from": "gpt", "value": "(B) white metallic rail at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b34151ea21cc388c.jpg", "conversations": [ { "from": "human", "value": "\nDoes bronze statue at center appear under yellowfloralflower at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, bronze statue at center is not below yellowfloralflower at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/93186865a19be213.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is black matte t-shirt at left located relative to black matte shirt at center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/163725aa7c81990f.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of metallic silver cars at lower left and matte black jacket at lower right in the image provided, where is metallic silver cars at lower left located with respect to matte black jacket at lower right? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/734568bce285395c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) dark blue shirt at left (B) clear plastic cup at lower center" }, { "from": "gpt", "value": "(B) clear plastic cup at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/57d969b962c7c5bb.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.778, 0.438) (B) (0.552, 0.381) (C) (0.731, 0.467) (D) (0.333, 0.537)" }, { "from": "gpt", "value": "(A) (0.778, 0.438)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a735c12f75b372fd.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white cotton shirt at center is bigger than blue fabric dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, white cotton shirt at center is larger in size than blue fabric dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8800be4d51856ed2.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.984, 0.519) (B) (0.430, 0.877)" }, { "from": "gpt", "value": "(B) (0.430, 0.877)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec40d34cf0f8c4e7.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) bronze textured lion at center (B) bronze statue at center (C) sculpted bronze lion at center" }, { "from": "gpt", "value": "(A) bronze textured lion at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d048cacf314fa63a.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the white cotton shirt at center? (A) white shirt at center (B) pink striped sweater at left" }, { "from": "gpt", "value": "(A) white shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a9be18b3f199c976.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.783, 0.602) (B) (0.109, 0.967) (C) (0.714, 0.259)" }, { "from": "gpt", "value": "(B) (0.109, 0.967)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/935b55db555b5559.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) green matte baseball cap at upper left (B) green painted wood bench at center (C) green fleece jacket at left" }, { "from": "gpt", "value": "(B) green painted wood bench at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/55c4b28bd5f8b685.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.461, 0.617) (B) (0.455, 0.330) (C) (0.019, 0.541) (D) (0.227, 0.011)" }, { "from": "gpt", "value": "(D) (0.227, 0.011)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1ef41667a6bcad5.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if smooth brown tree trunk at left is positioned to the right of green textured tree at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, smooth brown tree trunk at left is to the left of green textured tree at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/992bf9a66c78a030.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the sunglasses at upper right? (A) bald head at center (B) smooth skin face at center (C) smooth white wings at center" }, { "from": "gpt", "value": "(A) bald head at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8da01ce2ce2c7dc7.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.661, 0.361) (B) (0.515, 0.859)" }, { "from": "gpt", "value": "(B) (0.515, 0.859)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78c56597206c66a6.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte glass skyscraper at center have a larger size compared to transparent glass tower at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte glass skyscraper at center is bigger than transparent glass tower at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd3521ddea9c755b.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue glossy table at lower left appear on the right side of pearl necklace at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, blue glossy table at lower left is not on the right side of pearl necklace at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/008f8828deb283f2.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if snowy white mountain at upper center is thinner than multicolored scarf at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, snowy white mountain at upper center might be wider than multicolored scarf at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f195cbddac023bff.jpg", "conversations": [ { "from": "human", "value": "\nIs green quilted jacket at center positioned in front of matte black jacket at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9943a287936f5f24.jpg", "conversations": [ { "from": "human", "value": "\nIs gray cotton t-shirt at center to the right of brown leather glove at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, gray cotton t-shirt at center is to the left of brown leather glove at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bbb775dbe674d365.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) white marble palace at center (B) white stone building at center" }, { "from": "gpt", "value": "(A) white marble palace at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f03119aa8afd969f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) black striped jacket at upper right (B) striped fabric shirt at left (C) translucent glass at lower left (D) black zip-up jacket at upper right" }, { "from": "gpt", "value": "(B) striped fabric shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04967790ac1874c5.jpg", "conversations": [ { "from": "human", "value": "\nDoes teal fabric armchair at right appear over transparent glass window at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, teal fabric armchair at right is not positioned above transparent glass window at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0797d4f80f3bb6d4.jpg", "conversations": [ { "from": "human", "value": "\nIs matte yellow pepper at center smaller than shiny silver tray at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, matte yellow pepper at center is not smaller than shiny silver tray at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3419f07695d392ce.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at lower right to the right of green leafy tree at left from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green leafy tree at lower right is positioned on the right side of green leafy tree at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4afd76085dafd51e.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue smooth suit at left have a lesser width compared to metallic silver microphone at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, blue smooth suit at left is not thinner than metallic silver microphone at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b7d3fc8faa473fb.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) white marble statue at left (B) white marble statue at center" }, { "from": "gpt", "value": "(A) white marble statue at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c091ae6d20a9f55e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if striped fabric shirt at center is positioned to the right of matte black laptop at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, striped fabric shirt at center is not on the right side of matte black laptop at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d5f568f03fb1bb2.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) white hoodie at center (B) orange fabric jackets at center (C) denim jacket at center (D) striped hoodie at center, is positioned closest to the denim jeans at center?" }, { "from": "gpt", "value": "(C) denim jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b439c276215f9bac.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte plastic poster at center have a lesser width compared to matte black suit at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, matte plastic poster at center's width is not less than matte black suit at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/98195cc8d5aa98a9.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.374, 0.719) (B) (0.314, 0.611)" }, { "from": "gpt", "value": "(A) (0.374, 0.719)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/44fd49d3092203b9.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) leather jacket at center (B) orange fabric canopy at upper center" }, { "from": "gpt", "value": "(A) leather jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd3e6aaae9414156.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) blue glossy pillar at right (B) dark gray jacket at center (C) blue glossy pillar at left" }, { "from": "gpt", "value": "(A) blue glossy pillar at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73f1056ecca806c0.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy plant at left is bigger than matte orange church tower at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, green leafy plant at left is larger in size than matte orange church tower at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/091120e8fedc742f.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown textured tree at upper left have a smaller size compared to green leafy tree at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, brown textured tree at upper left is not smaller in size than green leafy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c2f25b1441947a7.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the clear glass wine at center? Select from: (A) transparent glass at center (B) matte black suit at center (C) velvet black dress at lower left" }, { "from": "gpt", "value": "(A) transparent glass at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/348c76fe3ec6f410.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is matte black jacket at right located relative to dark gray jacket at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0706f6cbfcc86194.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) gray fabric waist bag at center (B) green grass at lower center" }, { "from": "gpt", "value": "(B) green grass at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b65cdbc8687b619d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray furry kangaroo at center is bigger than gray fur kangaroo at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, gray furry kangaroo at center is larger in size than gray fur kangaroo at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4f3bf1ebfdb300e.jpg", "conversations": [ { "from": "human", "value": "\nIs white smooth water at center thinner than green leafy trees at right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white smooth water at center's width is not less than green leafy trees at right's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5aeacdbaf01f0970.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) white glass building at center (B) glassy reflective windows at center" }, { "from": "gpt", "value": "(B) glassy reflective windows at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5a0280fbdf495226.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.563, 0.373) (B) (0.629, 0.516) (C) (0.455, 0.281) (D) (0.552, 0.198)" }, { "from": "gpt", "value": "(A) (0.563, 0.373)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0dc7d3f6b9d54f17.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) green sweater at center (B) matte black suit at center" }, { "from": "gpt", "value": "(B) matte black suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0c612620dbf1faba.jpg", "conversations": [ { "from": "human", "value": "\nIs brown textured sidewalk at center further to the viewer compared to matte yellow bag at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, brown textured sidewalk at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1107c6c3a05424a5.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) dark blue water at center (B) beige stone palace at center" }, { "from": "gpt", "value": "(B) beige stone palace at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/55e75431724e9926.jpg", "conversations": [ { "from": "human", "value": "\nDoes green matte leaves at upper right appear on the right side of green leafy tree at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green matte leaves at upper right is positioned on the right side of green leafy tree at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/65b89012e582c597.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) thatched straw hut at upper right (B) thatched straw hut at left" }, { "from": "gpt", "value": "(B) thatched straw hut at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9dcda81c95e7ef8c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.997, 0.812) (B) (0.400, 0.458) (C) (0.546, 0.319)" }, { "from": "gpt", "value": "(A) (0.997, 0.812)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb4adc5e0a54a6b7.jpg", "conversations": [ { "from": "human", "value": "\nIs blue shirt at center positioned behind green fabric table at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is behind green fabric table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f6f4a6478da1bd7c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.756, 0.964) (B) (0.828, 0.109) (C) (0.958, 0.295)" }, { "from": "gpt", "value": "(C) (0.958, 0.295)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/12a33c3bb6567dde.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) stone slate roof hut at right (B) green grassy at center (C) green rough bark tree at center (D) brown woolen jacket at center" }, { "from": "gpt", "value": "(B) green grassy at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b610e86d19da9a1c.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) green matte book at center (B) white paper book at center" }, { "from": "gpt", "value": "(B) white paper book at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0c7cb2df184345d1.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden bench at lower right to the right of brown fabric bag at lower right from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, wooden bench at lower right is not to the right of brown fabric bag at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b007782d67d40b3.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) white plastic picnic table at center (B) green leafy tree at left (C) white glossy van at center" }, { "from": "gpt", "value": "(A) white plastic picnic table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/157c331aad164ca1.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.326, 0.498) (B) (0.437, 0.992) (C) (0.758, 0.706)" }, { "from": "gpt", "value": "(A) (0.326, 0.498)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/72fe7594396b08f8.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.287, 0.905) (B) (0.581, 0.389) (C) (0.539, 0.322)" }, { "from": "gpt", "value": "(A) (0.287, 0.905)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c2ba431894d8fd9.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte t-shirt at right smaller than plaid cotton shirt at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8dd06418d570609.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of green matte tree at center less distant than that of dark gray matte helicopter at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b7d980424999325.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the knitted sweater at center? (A) matte black bow at center (B) matte yellow fabric at center" }, { "from": "gpt", "value": "(A) matte black bow at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9a8e6bfc71659772.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy trees at center below green leafy tree at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, green leafy trees at center is located below green leafy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/581c3ad380cdda47.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark brown leather jacket at center come in front of dark blue jeans at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b29f22e69ef3057.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.709, 0.342) (B) (0.729, 0.750)" }, { "from": "gpt", "value": "(A) (0.709, 0.342)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8892b3353b25cf1.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of matte brick building at center in relation to blue metallic truck at lower left? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4d414b8d63010b2e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if metallic pavement at center is smaller than teal fabric canopy at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, metallic pavement at center has a smaller size compared to teal fabric canopy at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5f4c8312caaea18c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte pink dress at center is positioned below sparkly pink dress at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, matte pink dress at center is not positioned below sparkly pink dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9e75952dfd9eb8da.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) metallic gray bridge at upper left (B) black metal railing at right" }, { "from": "gpt", "value": "(B) black metal railing at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ac0fc247a0a0b70.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) gray rough bark tree trunk at center (B) black asphalt path at lower right" }, { "from": "gpt", "value": "(A) gray rough bark tree trunk at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95ca8ed9962b5121.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) white matte building at center (B) brown dusty ground at lower center (C) green fabric dress at center" }, { "from": "gpt", "value": "(C) green fabric dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f16d7f8b498bf889.jpg", "conversations": [ { "from": "human", "value": "\nIs blue matte t-shirt at right above striped cotton shirt at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0507a2e4375fb2c0.jpg", "conversations": [ { "from": "human", "value": "\nIs black sequined dress at upper center thinner than black sequined dress at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, black sequined dress at upper center's width is not less than black sequined dress at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/310d8f8825215d8a.jpg", "conversations": [ { "from": "human", "value": "\nDoes black floral dress at center appear under white fabric at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, black floral dress at center is not below white fabric at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ffeef40b36fb00c3.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) brown leather jacket at center (B) shiny chrome motorcycle at center (C) gray cobblestone pavement at center (D) dark blue jacket at center" }, { "from": "gpt", "value": "(C) gray cobblestone pavement at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/751703ca6e8813c2.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of pink hair at left in reference to black matte microphone at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b012815314fe0e17.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the pink floral fabric dress at center? (A) matte black dress at center (B) leopard print fabric dress at left" }, { "from": "gpt", "value": "(B) leopard print fabric dress at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc62777a283d6d54.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte red coat at left have a greater width compared to matte red jacket at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, matte red coat at left is wider than matte red jacket at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f77da25e2c8cf7a8.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) white matte fish at lower center (B) fuzzy white cat at center" }, { "from": "gpt", "value": "(A) white matte fish at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9cd985660c1a512c.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow reflective safety vest at lower center bigger than yellow reflective safety vest at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/548ca2b5d7d595b8.jpg", "conversations": [ { "from": "human", "value": "\nIs matte plastic tambourine at center below green leafy vegetables at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte plastic tambourine at center is below green leafy vegetables at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb798670241ee552.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) brown furry monkey at center (B) grayish-brown fur monkey at center" }, { "from": "gpt", "value": "(B) grayish-brown fur monkey at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/18da2a825f4c9c8f.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the dark green sweater at left? Choose from: (A) red sweater at center (B) light green sweater at center (C) green corduroy dress at center" }, { "from": "gpt", "value": "(A) red sweater at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b2825ac07db7590f.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) checkered fabric shirt at center (B) matte black hat at center (C) black matte shirt at center" }, { "from": "gpt", "value": "(B) matte black hat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2bb002f61403b8aa.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the blue fabric cap at upper center? (A) gray fabric jacket at upper right (B) dark hair at lower left (C) black denim jeans at upper center (D) orange t-shirt at upper center" }, { "from": "gpt", "value": "(A) gray fabric jacket at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/83c7fe901620fc72.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green matte shirt at center is smaller than purple glitter socks at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, green matte shirt at center might be larger than purple glitter socks at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0adf5e6bb9ceafb5.jpg", "conversations": [ { "from": "human", "value": "\nDoes camouflage fabric shirt at center appear over pink gingham dress at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, camouflage fabric shirt at center is positioned over pink gingham dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5179ffe65b863bc.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green matte uniform at center is positioned below matte black helmet at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green matte uniform at center is positioned under matte black helmet at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/473889f75b32308e.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of white concrete lighthouse at center more distant than that of clear water at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6ab4bb306a791f2.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the clear glass window at upper center from the following options: (A) matte glass window at upper left (B) clear glass window at center?" }, { "from": "gpt", "value": "(A) matte glass window at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ae92e6a06311a377.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.736, 0.628) (B) (0.469, 0.036)" }, { "from": "gpt", "value": "(A) (0.736, 0.628)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ce435a96099e576.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if autumn leaves at center is smaller than dark blue water at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, autumn leaves at center is not smaller in size than dark blue water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/12088de51c882cb2.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the black matte jacket at upper right among (A) matte blue jacket at center (B) white matte baseball cap at upper center?" }, { "from": "gpt", "value": "(A) matte blue jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b399e0fa08e53f6c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.245, 0.281) (B) (0.573, 0.195) (C) (0.863, 0.953)" }, { "from": "gpt", "value": "(A) (0.245, 0.281)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/462991cd3b3e61b8.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the purple glass table at center? Choose among these: (A) white glossy shirt at upper center (B) transparent glass sphere at center" }, { "from": "gpt", "value": "(B) transparent glass sphere at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e1be5103f34edf59.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green shrubbery at center is wider than green succulent at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, green shrubbery at center is wider than green succulent at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34258f26e20f4fea.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.422, 0.781) (B) (0.185, 0.625)" }, { "from": "gpt", "value": "(A) (0.422, 0.781)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca03ecb5aea35054.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) clear glass window at lower right (B) black stone column at left (C) transparent glass window at upper center (D) clear glass window at upper center" }, { "from": "gpt", "value": "(B) black stone column at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1144b0a6c1e46e77.jpg", "conversations": [ { "from": "human", "value": "\nIs matte red cooler at center bigger than green matte plant at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, matte red cooler at center is larger in size than green matte plant at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3bafcf20a748f172.jpg", "conversations": [ { "from": "human", "value": "\nIs blue fleece jacket at center wider than blue fleece sweatshirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a656ad7dcc48929b.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) green leafy tree at lower left (B) green leafy olive tree at center (C) green leafy tree at center" }, { "from": "gpt", "value": "(C) green leafy tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/423d107c6c43f441.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.135, 0.628) (B) (0.485, 0.627)" }, { "from": "gpt", "value": "(B) (0.485, 0.627)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/175e710db2d1b3ef.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue liquid water at upper right is thinner than camo shorts at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/899012f5eea7c719.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte blue face at right have a lesser width compared to matte blue face at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte blue face at right is thinner than matte blue face at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c5af9313ff3ffd85.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the black glossy portrait at upper left? Choose among these: (A) dark gray suit at left (B) blue snakeskin blouse at center (C) pink fabric microphone at center (D) black matte microphone at center" }, { "from": "gpt", "value": "(C) pink fabric microphone at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4ac1beacdef99cfc.jpg", "conversations": [ { "from": "human", "value": "\nDoes red matte stop sign at left appear on the right side of red plastic stop sign at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, red matte stop sign at left is to the right of red plastic stop sign at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/30b436f1b23ab3f5.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is matte red mailbox at center located relative to white wooden bench at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/078b26b8ce0ce758.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) white glass tower at center (B) green leafy tree at lower left" }, { "from": "gpt", "value": "(B) green leafy tree at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df596e5257fe0912.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown dirt track at center is smaller than black wood cabin at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, brown dirt track at center is not smaller in size than black wood cabin at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/15daf8b4b62fc7e3.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of rusty metal ring at center in reference to dark gray hoodie at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c075d741205ca26.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.400, 0.613) (B) (0.812, 0.306)" }, { "from": "gpt", "value": "(A) (0.400, 0.613)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b91e40e681fca18.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark blue suit at center is smaller than dark suit at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, dark blue suit at center occupies less space than dark suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a1c19d571b6a529.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown stone building at right is thinner than blue denim shorts at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, brown stone building at right might be wider than blue denim shorts at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c64788856050482.jpg", "conversations": [ { "from": "human", "value": "\nIs white fabric tank top at center closer to the viewer compared to blue cotton shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white fabric tank top at center is behind blue cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/43e392d4baa7f68a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white matte text at center is positioned above dark suit at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, white matte text at center is above dark suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/76af9270493e18ae.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.756, 0.208) (B) (0.683, 0.405)" }, { "from": "gpt", "value": "(A) (0.756, 0.208)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f507f2951add07a.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at upper center come in front of brown feathered bird at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is in front of brown feathered bird at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a9e3b6df0db598bf.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.654, 0.334) (B) (0.235, 0.641)" }, { "from": "gpt", "value": "(A) (0.654, 0.334)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e2340fa7bbfa3ff3.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray stone steps at center have a greater width compared to gray stone wall at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, gray stone steps at center is wider than gray stone wall at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c3959f66f098ba4b.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) brown furry dog at center (B) green grassy field at center" }, { "from": "gpt", "value": "(A) brown furry dog at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/510d24038577cfa6.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.898, 0.675) (B) (0.242, 0.628)" }, { "from": "gpt", "value": "(A) (0.898, 0.675)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3f7bf691f7a0b3f8.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue fabric shirt at center appear under matte black camera bag at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, blue fabric shirt at center is not below matte black camera bag at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/21b93401fd1e4bd1.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) dark blue jeans at lower right (B) shiny silver sedan at center" }, { "from": "gpt", "value": "(A) dark blue jeans at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e5ddb1f55c23b10.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of brown fuzzy kitten at center in reference to light brown fur at left? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/422841c57ae4a223.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the matte red onesie at right? Select from: (A) matte red onesie at left (B) matte red onesie at center (C) matte red shirt at center" }, { "from": "gpt", "value": "(A) matte red onesie at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c83cea7139fa70b.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.939, 0.184) (B) (0.491, 0.109)" }, { "from": "gpt", "value": "(B) (0.491, 0.109)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01bde80d70e5dce2.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) blue denim jeans at lower right (B) matte black shirt at center" }, { "from": "gpt", "value": "(B) matte black shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ee169e95d403e4a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if shiny maroon convertible at center is positioned to the right of shiny dark brown convertible at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, shiny maroon convertible at center is to the right of shiny dark brown convertible at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/102b6648b5bd79f9.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow matte shirt at center wider than silver metallic rail at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, yellow matte shirt at center is wider than silver metallic rail at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0acf70024e74b6c6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if teal matte/deckbus at left is bigger than white signboard at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, teal matte/deckbus at left is not larger than white signboard at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82772c6ed5c8d5a2.jpg", "conversations": [ { "from": "human", "value": "\nDoes white glossy table at center appear under white ceramic mug at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, white glossy table at center is located below white ceramic mug at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7415428b306b20ca.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) dark gray fabric at center (B) white matte balloon at upper right" }, { "from": "gpt", "value": "(A) dark gray fabric at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/881ed46950ad1864.jpg", "conversations": [ { "from": "human", "value": "\nIs dark gray pinstripe suit at left positioned at the back of silky maroon dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4fb3c2aae0d716ad.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.043, 0.991) (B) (0.845, 0.617)" }, { "from": "gpt", "value": "(B) (0.845, 0.617)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4df8a7ea37a8a869.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if plaid shirt at center is positioned above matte red shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, plaid shirt at center is not above matte red shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/635ed9a0fe98874c.jpg", "conversations": [ { "from": "human", "value": "\nIs white leather bag at center above white leather bag at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, white leather bag at center is above white leather bag at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/13719d83bcf49422.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the black leather jacket at left? (A) black leather jacket at center (B) dark blue jeans at center" }, { "from": "gpt", "value": "(B) dark blue jeans at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02fe7f5371ff5283.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.273, 0.025) (B) (0.132, 0.048)" }, { "from": "gpt", "value": "(A) (0.273, 0.025)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70765ddeb3537dbb.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of green matte jacket at center and black matte tripod at lower right in the image provided, where is green matte jacket at center located with respect to black matte tripod at lower right? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7dc5f72bb0030553.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.917, 0.405) (B) (0.705, 0.481) (C) (0.652, 0.334) (D) (0.555, 0.348)" }, { "from": "gpt", "value": "(D) (0.555, 0.348)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/316732883524354c.jpg", "conversations": [ { "from": "human", "value": "\nDoes orange fabric banner at upper left have a greater width compared to red silk flag at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c4b5fbc9ce498ecc.jpg", "conversations": [ { "from": "human", "value": "\nIs blue matte mountain bike at center wider than matte blue helmet at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, blue matte mountain bike at center has a greater width compared to matte blue helmet at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5904374ca9b0da71.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.652, 0.250) (B) (0.874, 0.683) (C) (0.300, 0.214)" }, { "from": "gpt", "value": "(B) (0.874, 0.683)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a5ae6b2fba494047.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark blue velvet vest at center is smaller than velvet black vest at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d1b053159ba432b.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue water at center come behind green leafy palm tree at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is behind green leafy palm tree at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d10247250af819d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if wooden table at center is positioned above dark blue fabric business suit at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, wooden table at center is not positioned above dark blue fabric business suit at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd5c3942e7d0b943.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is shiny black guitar at center located relative to metallic red electric guitar at center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/15bb627f3106050b.jpg", "conversations": [ { "from": "human", "value": "\nIs floral cotton shirt at center further to the viewer compared to green striped shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is in front of green striped shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce5c733b623270be.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.427, 0.928) (B) (0.300, 0.039)" }, { "from": "gpt", "value": "(A) (0.427, 0.928)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7c116c2654efd7f2.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) stone bridge at center (B) greenish water at center" }, { "from": "gpt", "value": "(A) stone bridge at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fbac589699b58393.jpg", "conversations": [ { "from": "human", "value": "\nDoes purple matte shirt at center have a larger size compared to white shirt at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, purple matte shirt at center is bigger than white shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37eff4f461056405.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.761, 0.733) (B) (0.734, 0.758) (C) (0.286, 0.709) (D) (0.930, 0.697)" }, { "from": "gpt", "value": "(D) (0.930, 0.697)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/833a6ed3d92d311e.jpg", "conversations": [ { "from": "human", "value": "\nIs red polished wood decker bus at center thinner than light beige wood airplane at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, red polished wood decker bus at center has a lesser width compared to light beige wood airplane at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c1cfb46a704f4fde.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) matte blue shirt at left (B) light green t-shirt at center" }, { "from": "gpt", "value": "(B) light green t-shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc83d78d80b30b93.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.637, 0.809) (B) (0.385, 0.812)" }, { "from": "gpt", "value": "(A) (0.637, 0.809)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fba246d30906c62b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white glossy statue at center is bigger than white glossy statue at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white glossy statue at center is not larger than white glossy statue at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0f48990bdd68a31a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if stained glass window at center is positioned to the left of multicolored stained glass at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find stained glass window at center to the left of multicolored stained glass at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4c1165f6b089816c.jpg", "conversations": [ { "from": "human", "value": "\nIs dark gray cotton shorts at right wider than dark blue shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, dark gray cotton shorts at right is wider than dark blue shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/83a25c7d57884394.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the black leather jacket at center? Choose among these: (A) light brown hair at center (B) blue fleece jacket at center (C) white plastic street sign at upper center" }, { "from": "gpt", "value": "(B) blue fleece jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/98fb5c8a01fbfbfd.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.455, 0.947) (B) (0.423, 0.350) (C) (0.759, 0.909)" }, { "from": "gpt", "value": "(C) (0.759, 0.909)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5920f2975a4ce6a4.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) white plastic chair at center (B) metallic silver basketball hoop at right" }, { "from": "gpt", "value": "(A) white plastic chair at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4c03d83b085a17bb.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the black fabric shirt at lower center? Choose among these: (A) light blue shirt at lower right (B) blue shorts at lower right (C) brown wool sweater at lower center (D) white matte projector screen at upper center" }, { "from": "gpt", "value": "(D) white matte projector screen at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6daeba7ceb7bd46d.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the white textured blazer at center? (A) black suit at center (B) dark gray suit at center" }, { "from": "gpt", "value": "(B) dark gray suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/014af34d74c77416.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of white plastic bus stop at left in reference to blue plastic sign at upper right? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc2e60de24ebf96f.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.250, 0.530) (B) (0.539, 0.347) (C) (0.766, 0.366) (D) (0.662, 0.936)" }, { "from": "gpt", "value": "(A) (0.250, 0.530)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc4c50866f12b1a1.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black microphone at center have a larger size compared to white glossy shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, matte black microphone at center has a larger size compared to white glossy shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/92104ddba18c5dc8.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.913, 0.656) (B) (0.674, 0.708) (C) (0.664, 0.803) (D) (0.033, 0.866)" }, { "from": "gpt", "value": "(D) (0.033, 0.866)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a3f2b20584587c3f.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.334, 0.423) (B) (0.225, 0.364)" }, { "from": "gpt", "value": "(B) (0.225, 0.364)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/725dbcc95324dcbb.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white smooth line at center is smaller than shiny orange helmet at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, white smooth line at center is not smaller in size than shiny orange helmet at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c89b6e05c302462f.jpg", "conversations": [ { "from": "human", "value": "\nIs matte blue blazer at upper left to the left of brown felt fedora at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte blue blazer at upper left is to the left of brown felt fedora at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a72a9f5de06fb84.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the green leafy tree at center? (A) bare wood tree at center (B) green leafy tree at left" }, { "from": "gpt", "value": "(B) green leafy tree at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/52c3c42b899b1462.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the orange/gray fabric tent at center? Choose from: (A) orange/white mesh tent at left (B) brown textured tree at center" }, { "from": "gpt", "value": "(A) orange/white mesh tent at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ee82e57ec42646c5.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte shirt at center lie in front of white matte uniform at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, white matte shirt at center is in front of white matte uniform at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a6a6b3f9b36fd4f.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is pink matte tank top at center located relative to blue rubber yoga mat at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b4fe2938b83786cb.jpg", "conversations": [ { "from": "human", "value": "\nDoes wooden acoustic guitar at center have a smaller size compared to black metallic microphone at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, wooden acoustic guitar at center might be larger than black metallic microphone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3176e13f7aae5baa.jpg", "conversations": [ { "from": "human", "value": "\nWhere is matte black ski at left located in relation to white rubber snowshoe at lower center in the image? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e6af2bf26529856.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue fabric shorts at lower right is positioned to the left of white matte jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, blue fabric shorts at lower right is not to the left of white matte jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8f2f9ea900c2391.jpg", "conversations": [ { "from": "human", "value": "\nIs green mossy rock at lower left bigger than rocky waterfall at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, green mossy rock at lower left is not bigger than rocky waterfall at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/020dfff43822d7ee.jpg", "conversations": [ { "from": "human", "value": "\nIs blue metallic bridge at center smaller than matte red train at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, blue metallic bridge at center might be larger than matte red train at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ca857d10c8ceb24.jpg", "conversations": [ { "from": "human", "value": "\nDoes green ribbed shirt at right lie behind white matte plate at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/15895893871af795.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) black plastic camera at right (B) matte gray jacket at upper right" }, { "from": "gpt", "value": "(A) black plastic camera at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/488bedfecaa7abd3.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny black sedan at center smaller than green leafy palm tree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, shiny black sedan at center is smaller than green leafy palm tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e07207202fb2d283.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the shiny dark green sedan at center? Choose from: (A) green plastic sign at upper center (B) green glass traffic light at upper center (C) metallic gray sedan at center" }, { "from": "gpt", "value": "(B) green glass traffic light at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc695c0b52811b2e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) black satin skirt at center (B) brown cotton shirt at lower left (C) black fabric uniform at center" }, { "from": "gpt", "value": "(C) black fabric uniform at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/32dc3a52824337be.jpg", "conversations": [ { "from": "human", "value": "\nDoes green translucent water at center appear on the right side of black rubber paddle at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, green translucent water at center is positioned on the right side of black rubber paddle at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e78f751782efb2a.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark brown jacket at center appear over khaki fleece jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d123ccfa9c484120.jpg", "conversations": [ { "from": "human", "value": "\nIs rocky cliff at center to the right of translucent glass waterfall at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find rocky cliff at center to the right of translucent glass waterfall at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3d6c42d74b3042ce.jpg", "conversations": [ { "from": "human", "value": "\nIs thatched straw hut at center positioned before white printed shirt at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is behind white printed shirt at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/914ffc3abd6e0663.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if yellow grass at center is thinner than rustic sandstone rock formation at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e92feb2ad3e82e17.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) yellow-green painted pole at center (B) green plastic street sign at upper center (C) multicolored painted building at center" }, { "from": "gpt", "value": "(A) yellow-green painted pole at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f238e964aa8b1c14.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if shiny metallic bicycle at center is bigger than white matte bicycle helmet at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, shiny metallic bicycle at center is not bigger than white matte bicycle helmet at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/50f7d255cfb12a66.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.779, 0.222) (B) (0.534, 0.533) (C) (0.913, 0.713)" }, { "from": "gpt", "value": "(C) (0.913, 0.713)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/17b7e6199d2c9025.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) concrete sidewalk at lower left (B) smooth orange tree at center (C) gray concrete path at lower right (D) green grass at center" }, { "from": "gpt", "value": "(B) smooth orange tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/51a910c0db1fc4c5.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) white pleated dress at left (B) floral dress at right (C) matte brown guitar at center (D) matte gray dress at right, is positioned farthest from the blue plaid shorts at right?" }, { "from": "gpt", "value": "(A) white pleated dress at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce83a8c09a0036e4.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of white ice at center in reference to black wool coat at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5ee9cc38ff220e36.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.848, 0.816) (B) (0.983, 0.869)" }, { "from": "gpt", "value": "(B) (0.983, 0.869)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4eb7ede9e7088523.jpg", "conversations": [ { "from": "human", "value": "\nIs brown satin dress at center above light beige shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, brown satin dress at center is below light beige shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a36be4f7532b9ec.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.644, 0.516) (B) (0.720, 0.248) (C) (0.097, 0.556) (D) (0.380, 0.867)" }, { "from": "gpt", "value": "(B) (0.720, 0.248)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5f736b34c8b9d5a8.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the mahogany wood door at center? Choose among these: (A) black wrought iron balcony at upper center (B) polished metal balustrade at center" }, { "from": "gpt", "value": "(B) polished metal balustrade at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e6821c22d1048a6.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte shirt at center to the right of translucent plastic glass at right from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, black matte shirt at center is to the left of translucent plastic glass at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d83ec83295e066d2.jpg", "conversations": [ { "from": "human", "value": "\nIs transparent glass pillar at center above red matte jacket at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e2f43ef03ecefe22.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) black matte sunglasses at right (B) black matte sunglasses at lower right (C) brown sand at lower right" }, { "from": "gpt", "value": "(C) brown sand at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a0f009b5d431dacc.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of dry grass at center and green leafy tree at upper left in the image provided, where is dry grass at center located with respect to green leafy tree at upper left? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/56bee3cc5eb19f7c.jpg", "conversations": [ { "from": "human", "value": "\nDoes silhouette bare tree at center have a lesser width compared to white textured snow at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, silhouette bare tree at center's width is not less than white textured snow at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/65dac0e534603c5c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) floral-patterned scarf at center (B) black fabric scarf at center, is positioned farthest from the white matte jacket at center?" }, { "from": "gpt", "value": "(B) black fabric scarf at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/da423c3bb128c447.jpg", "conversations": [ { "from": "human", "value": "\nDoes white stone relief at left have a larger size compared to white stone carving at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, white stone relief at left has a larger size compared to white stone carving at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b20a882c24be5a7.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the wooden picket fence at lower right from the following options: (A) white fluffy snow at lower center (B) gray woodshed at left?" }, { "from": "gpt", "value": "(B) gray woodshed at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bebcbfaaa9268c15.jpg", "conversations": [ { "from": "human", "value": "\nIs green metal rail at center closer to the viewer compared to green corrugated pipe at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9f35aa1ad1bfc2f.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny black bike at lower right to the right of matte black t-shirt at left from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, shiny black bike at lower right is to the right of matte black t-shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/484a87359905aa2d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if yellow/yellow striped jersey at center is positioned below dark blue jersey at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1c2af5bc12fb8bd.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is white fluffy snowman at center located relative to black mesh fire pit at lower left? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd5ae57f074e316f.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue glossy water at center is wider than asphalt road at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eafa254e3a6c72f3.jpg", "conversations": [ { "from": "human", "value": "\nDoes rough bark tree trunk at center appear on the right side of smooth gray bark at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, rough bark tree trunk at center is not to the right of smooth gray bark at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/673ec3114e2490bf.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark blue suit at center have a smaller size compared to sparkly beige dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, dark blue suit at center might be larger than sparkly beige dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db0367511020b3b3.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the metallic silver gear at center? Choose from: (A) polished silver rim at center (B) silver metallic rim at center" }, { "from": "gpt", "value": "(A) polished silver rim at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7fe76f616c02f177.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is brown rough wood pole at left located relative to brown wood pole at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/80cbe7ac6edce6b5.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) brown cardboard golf cart at center (B) white satin dress at center, is positioned closest to the pink silk bouquet at center?" }, { "from": "gpt", "value": "(B) white satin dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c01b574c274fb3f4.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass at lower center bigger than smooth brown tree trunk at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, green grass at lower center is bigger than smooth brown tree trunk at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b64bed0b777b2ab2.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) white glossy flower at center (B) translucent amber glass vase at center (C) white matte flower at center" }, { "from": "gpt", "value": "(B) translucent amber glass vase at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/510fe0a57ea16d71.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.672, 0.487) (B) (0.222, 0.356)" }, { "from": "gpt", "value": "(B) (0.222, 0.356)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b2aac8f09768b670.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of purple fabric at center and smooth blonde hair at center in the image provided, where is purple fabric at center located with respect to smooth blonde hair at center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ee482d68780bbf45.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) dark gray jacket at center-right (B) matte black jacket at left, is positioned farthest from the smooth concrete pavement at center?" }, { "from": "gpt", "value": "(A) dark gray jacket at center-right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/13f983e935abc264.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.309, 0.403) (B) (0.244, 0.620) (C) (0.330, 0.339)" }, { "from": "gpt", "value": "(B) (0.244, 0.620)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/65fe3992e286811e.jpg", "conversations": [ { "from": "human", "value": "\nIs brown stone building at center thinner than stone steeple at right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, brown stone building at center might be wider than stone steeple at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4b068d8b5f4be1e0.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of blue fabric shoe at upper left in relation to blue fabric pants at upper center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/488d931befd25340.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if concrete at center is thinner than green matte car at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a110d9f96e7dd6dc.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.389, 0.470) (B) (0.103, 0.872)" }, { "from": "gpt", "value": "(A) (0.389, 0.470)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/98980568f8517ec3.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the shiny blue bikini top at center? (A) matte silver bikini top at left (B) shiny blue sequins bikini top at center" }, { "from": "gpt", "value": "(A) matte silver bikini top at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c271531d5ab1582.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow cotton pants at center positioned before dark brown leather jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e29def49b58b0e28.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) smooth skin face at center (B) translucent white angel at upper right" }, { "from": "gpt", "value": "(B) translucent white angel at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4bcf6d44cd69daca.jpg", "conversations": [ { "from": "human", "value": "\nWhere is matte khaki shirt at center located in relation to black matte clipboard at center in the image? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3f010f14414ba500.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown fabric shirt at center have a greater width compared to matte red t-shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, brown fabric shirt at center might be narrower than matte red t-shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8ba11c5e2d57bf7f.jpg", "conversations": [ { "from": "human", "value": "\nIs dark water at center closer to camera compared to white glossy boat at center-right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/39e78d1207e3d192.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.265, 0.006) (B) (0.927, 0.155) (C) (0.641, 0.039)" }, { "from": "gpt", "value": "(A) (0.265, 0.006)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07949561f6398d7d.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte blue jersey at center have a larger size compared to black matte knee pad at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, matte blue jersey at center is larger in size than black matte knee pad at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1e6d9e5bd5186a51.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) yellow matte building at left (B) yellow stone building at center" }, { "from": "gpt", "value": "(A) yellow matte building at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/74978abbcd0a559a.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at center have a lesser width compared to white matte windmill at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b334370338d177a.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the matte black t-shirt at left among (A) black leather jacket at center (B) black leather jacket at right?" }, { "from": "gpt", "value": "(A) black leather jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/439abb1865a41e44.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black tank top at center to the left of blue fabric shirt at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte black tank top at center is to the left of blue fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3fb5437c76fca39b.jpg", "conversations": [ { "from": "human", "value": "\nWhere is white ceramic cup at upper center located in relation to silver metallic fork at lower center in the image? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/76baa94cbaf3fb60.jpg", "conversations": [ { "from": "human", "value": "\nDoes transparent glass door at center come behind white paper sign at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, transparent glass door at center is behind white paper sign at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8154d60c6346651c.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the dark brown hair at lower center? (A) yellow metallic traffic light at upper center (B) matte red truck at center (C) light brown hair at center" }, { "from": "gpt", "value": "(B) matte red truck at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/51461e9fce7bcd3e.jpg", "conversations": [ { "from": "human", "value": "\nIs dark glossy jar at left to the right of orange matte at upper center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, dark glossy jar at left is not on the right side of orange matte at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9de991852caedcfa.jpg", "conversations": [ { "from": "human", "value": "\nIs stone gothic cathedral at center bigger than dark gray sweater at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, stone gothic cathedral at center is larger in size than dark gray sweater at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/68d71b25198f5aec.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.144, 0.442) (B) (0.487, 0.362) (C) (0.851, 0.425)" }, { "from": "gpt", "value": "(B) (0.487, 0.362)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7d3066f4a2e03a59.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) silver metallic car at left (B) denim jacket at right (C) beige felt cowboy hat at center (D) blue denim jeans at center" }, { "from": "gpt", "value": "(C) beige felt cowboy hat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6956b5571282a641.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) chocolate cake at right (B) smooth skin face at right (C) white cotton shirt at right (D) white porcelain plate at lower right" }, { "from": "gpt", "value": "(D) white porcelain plate at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6fbc4f7f8b634ef3.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) matte red shirt at left (B) red checkered shirt at right" }, { "from": "gpt", "value": "(B) red checkered shirt at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8487d3bdfd446648.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is blue sweater at center located relative to matte brown sweater at upper right? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f8e0f44b1e8c2c3e.jpg", "conversations": [ { "from": "human", "value": "\nDoes black leather boot at center have a greater width compared to glossy patent leather boot at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, the width of black leather boot at center exceeds that of glossy patent leather boot at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b15ee48f2db4d87.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white cotton shirt at center is positioned above brown fur dog at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, white cotton shirt at center is located above brown fur dog at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6a4c8524c6b871bc.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte orange pillow at left appear on the left side of striped shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, matte orange pillow at left is to the left of striped shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d8e523cfa411965.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of matte floral dress at left and white shirt at center in the image provided, where is matte floral dress at left located with respect to white shirt at center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/076a1d834bcd1da0.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.566, 0.906) (B) (0.387, 0.941)" }, { "from": "gpt", "value": "(B) (0.387, 0.941)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/278fb12582052b46.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy hedge at center have a greater width compared to gray concrete sidewalk at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, green leafy hedge at center has a greater width compared to gray concrete sidewalk at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/94849ff170faf547.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.826, 0.969) (B) (0.249, 0.738) (C) (0.142, 0.720) (D) (0.409, 0.762)" }, { "from": "gpt", "value": "(A) (0.826, 0.969)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5214f638f57d5d8f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.549, 0.463) (B) (0.648, 0.547)" }, { "from": "gpt", "value": "(B) (0.648, 0.547)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/483de519d2d16d50.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth brown bark at center in front of brown speckled feathers at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, smooth brown bark at center is in front of brown speckled feathers at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b624659c7b8c6cf6.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) chocolate matte pig at center (B) white fondant cupcake with panda decoration at center (C) purple glossy cupcake at center (D) matte white cupcake with blue candies at center" }, { "from": "gpt", "value": "(D) matte white cupcake with blue candies at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d8516c8bfe4e7a47.jpg", "conversations": [ { "from": "human", "value": "\nDoes stainless steel pot at upper right come behind wooden countertop at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/83c453f9d6deeadc.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green matte shirt at center is positioned to the left of orange-brown fur tiger at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, green matte shirt at center is not on the left side of orange-brown fur tiger at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/072cbcd06e0b60c6.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) white feathered bird at upper right (B) white fabric sailboat at upper center" }, { "from": "gpt", "value": "(A) white feathered bird at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/653be75726a53046.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) dark green leafy tree at lower left (B) smooth bark tree at center" }, { "from": "gpt", "value": "(A) dark green leafy tree at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f567fd59289dfbec.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the glossy glass window at upper center among (A) glossy plastic face at center (B) glossy metallic car window at upper center?" }, { "from": "gpt", "value": "(B) glossy metallic car window at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86bd0a274f9e39e7.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green grass at lower center located in relation to green leafy tree at center in the image? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6eed0537128371e1.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) orange matte/orange at center (B) brown leather jacket at center (C) leather jacket at lower center (D) black leather jacket at upper center" }, { "from": "gpt", "value": "(C) leather jacket at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f429e84bec8428b.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) wooden at lower right (B) black woolen scarf at lower right" }, { "from": "gpt", "value": "(A) wooden at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0c1f81b8cab39133.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the white cotton glove at center? Choose from: (A) brown fabric chair at right (B) white matte hand at center (C) satin red headscarf at upper left (D) smooth pink fabric at lower center" }, { "from": "gpt", "value": "(A) brown fabric chair at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f8531cd29a088e5d.jpg", "conversations": [ { "from": "human", "value": "\nIs blue cardboard mask at center thinner than blue paper mask at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, blue cardboard mask at center might be wider than blue paper mask at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c9b778d0be5525f.jpg", "conversations": [ { "from": "human", "value": "\nIs stained glass lampshade at upper center above stained glass dome at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, stained glass lampshade at upper center is not positioned above stained glass dome at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5c0f61c000fece6a.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) white matte shirt at center (B) white matte projection screen at upper center (C) dark brown fabric at center" }, { "from": "gpt", "value": "(C) dark brown fabric at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a481e11beb5fe456.jpg", "conversations": [ { "from": "human", "value": "\nDoes clear blue water at center come behind green leafy trees at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is in front of green leafy trees at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01a191ae3f0b20b7.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.588, 0.459) (B) (0.014, 0.509) (C) (0.219, 0.353)" }, { "from": "gpt", "value": "(B) (0.014, 0.509)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b7ad18e3e816a26.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of green leafy tree at upper center and clear glass window at center in the image provided, where is green leafy tree at upper center located with respect to clear glass window at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c98cd3d2e33859b5.jpg", "conversations": [ { "from": "human", "value": "\nIs black jersey at left to the right of yellow matte volleyball at upper center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, black jersey at left is not on the right side of yellow matte volleyball at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3dca46257be6b4ed.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray fur cat at upper right is positioned below gray fur cat at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, gray fur cat at upper right is not below gray fur cat at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf14e73d89398396.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) green bark tree at left (B) gray hair at center" }, { "from": "gpt", "value": "(A) green bark tree at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d1ca5a3671a6726.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.562, 0.725) (B) (0.253, 0.622)" }, { "from": "gpt", "value": "(A) (0.562, 0.725)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/deff67c4f3d734a9.jpg", "conversations": [ { "from": "human", "value": "\nDoes transparent glass window at right appear under transparent glass window at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, transparent glass window at right is located below transparent glass window at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d27305854dc99632.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) silhouette leafy palm at upper center (B) silhouette leafy palm at right (C) silhouette leafy palm at left (D) silhouette leafy palm at center" }, { "from": "gpt", "value": "(D) silhouette leafy palm at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7f0c0a7fb91717c6.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) glossy blue scooter at center (B) matte blue helmet at upper left" }, { "from": "gpt", "value": "(A) glossy blue scooter at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e9f945613e1a802b.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) black glossy shirt at center (B) dark gray suit at right (C) matte black suit at center" }, { "from": "gpt", "value": "(A) black glossy shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/22db9d8d75740082.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) rusty wrought iron sculpture at center (B) gray concrete pavement at center, is positioned closest to the smooth brown pole at right?" }, { "from": "gpt", "value": "(A) rusty wrought iron sculpture at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70ed5d71ee3bba6b.jpg", "conversations": [ { "from": "human", "value": "\nIs white plastic refrigerator at lower right thinner than brown matte pasta at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b95e7cce9405d17.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the brown velvet deer at right from the following options: (A) brown velvet deer at center (B) brown velvet deer at left (C) brown velvet antlered deer at center?" }, { "from": "gpt", "value": "(C) brown velvet antlered deer at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/057431a5452f3f85.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the pearl necklace at upper right from the following options: (A) green glass bottle at center (B) transparent glass at upper center (C) white matte shirt at center?" }, { "from": "gpt", "value": "(B) transparent glass at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f8ef2ed4becc247.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the black leather dog at center? Choose from: (A) shiny coral dress at left (B) shiny silver dress at center (C) matte black suit at right (D) matte gray suit at center" }, { "from": "gpt", "value": "(B) shiny silver dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/356faa292469f2d6.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte blue shirt at center have a lesser width compared to matte blue globe at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, matte blue shirt at center's width is less than matte blue globe at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff6819a136ccb59c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green patina metal sculpture at center is positioned above green matte van at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, green patina metal sculpture at center is not above green matte van at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4ff3d9b77c59d91.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the gray rough rock at center? Choose among these: (A) golden fur monkey at left (B) fuzzy brown monkey at center" }, { "from": "gpt", "value": "(B) fuzzy brown monkey at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/afc2b8b924617661.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the black plastic camera at center? Choose among these: (A) blonde hair at lower right (B) blue matte jacket at center" }, { "from": "gpt", "value": "(B) blue matte jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c33faa0b2bf56b1c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.515, 0.436) (B) (0.972, 0.758)" }, { "from": "gpt", "value": "(A) (0.515, 0.436)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6c4e2d72efe2831.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.343, 0.392) (B) (0.717, 0.391)" }, { "from": "gpt", "value": "(A) (0.343, 0.392)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/153258978d1fda77.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) white glossy bathtub at upper left (B) orange wood window at upper left" }, { "from": "gpt", "value": "(A) white glossy bathtub at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/12a18db3189dac0e.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of satin dress at center more distant than that of red satin bouquet at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is in front of red satin bouquet at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b3a0f04a44bae8b2.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark blue sweater at left have a larger size compared to black velvet coat at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/19c7212e764e60ac.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray fabric bag at lower right have a lesser width compared to green fabric jacket at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, gray fabric bag at lower right's width is less than green fabric jacket at lower left's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0197b5048a0c0b2c.jpg", "conversations": [ { "from": "human", "value": "\nIs ivory lace dress at upper right further to the viewer compared to white plastic blinds at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, ivory lace dress at upper right is in front of white plastic blinds at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b505230705f1adbb.jpg", "conversations": [ { "from": "human", "value": "\nDoes white marble column at center appear over white marble column at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, white marble column at center is located above white marble column at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/30e51069d95a8dc8.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) light brown leather jacket at center (B) black leather jacket at upper center (C) smooth black hair at upper center (D) black textured suitcase at center" }, { "from": "gpt", "value": "(D) black textured suitcase at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ffcf5a5a4603a0c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) orange fabric backpack at center (B) blue fabric cap at center, is positioned closest to the dark gray shirt at upper center?" }, { "from": "gpt", "value": "(A) orange fabric backpack at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eea396ed0111e07e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if clear glass water at center is positioned below matte black backpack at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, clear glass water at center is located below matte black backpack at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3bc29180d6d979e0.jpg", "conversations": [ { "from": "human", "value": "\nDoes white foam paper towel at lower left come behind silver metallic ring at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/209d61cf21c96438.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the striped wool scarf at right from the following options: (A) floral fabric scarf at lower left (B) floral fabric at left?" }, { "from": "gpt", "value": "(A) floral fabric scarf at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e362b5e39c75816.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.571, 0.264) (B) (0.708, 0.353) (C) (0.449, 0.305)" }, { "from": "gpt", "value": "(A) (0.571, 0.264)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b934ba158d5491d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.820, 0.291) (B) (0.605, 0.630)" }, { "from": "gpt", "value": "(A) (0.820, 0.291)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6486eff374f61392.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the green matte folder at upper right? (A) green striped shirt at center (B) leather jacket at left" }, { "from": "gpt", "value": "(B) leather jacket at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7a5540102f7ca2d1.jpg", "conversations": [ { "from": "human", "value": "\nDoes white paper book at center have a larger size compared to beige cardboard box at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, white paper book at center is bigger than beige cardboard box at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1321f8641953f10e.jpg", "conversations": [ { "from": "human", "value": "\nDoes black smooth dog at left have a greater width compared to plaid fabric pillow at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, black smooth dog at left is wider than plaid fabric pillow at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d88bd236a481efb9.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) black glossy car at left (B) satin metallic car at center" }, { "from": "gpt", "value": "(A) black glossy car at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d2a8b014f96349d.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) wooden park bench at center (B) white cotton shirt at right (C) blue denim jacket at lower right (D) wooden park bench at lower left" }, { "from": "gpt", "value": "(D) wooden park bench at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b29cefd7f4fcb06.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte dress at center smaller than matte black t-shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5aeca0be4eeda7b9.jpg", "conversations": [ { "from": "human", "value": "\nIs gray matte water at center wider than green leafy branch at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of gray matte water at center exceeds that of green leafy branch at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f153e8780c1f3bb5.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.896, 0.845) (B) (0.823, 0.770)" }, { "from": "gpt", "value": "(B) (0.823, 0.770)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a32ad3cf6ca79623.jpg", "conversations": [ { "from": "human", "value": "\nIs black polished piano at left above velvet-patterned armchair at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e30c9696d2124cfb.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) matte black dress at center (B) dark blue uniform at left (C) white shirt at center (D) matte black suit at center" }, { "from": "gpt", "value": "(A) matte black dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd78a1aafec054f3.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) gray metallic train track at lower center (B) green plastic train track at lower center" }, { "from": "gpt", "value": "(B) green plastic train track at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9bdd42677510d0d3.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black jacket at center appear over plaid flannel shirt at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, matte black jacket at center is not positioned above plaid flannel shirt at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/09ced56ccb88ae7e.jpg", "conversations": [ { "from": "human", "value": "\nIs matte blue shorts at left below matte black surfboard at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, matte blue shorts at left is located below matte black surfboard at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a020f8a6ced615a.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of green leafy hedge at lower left and green leafy bush at upper right in the image provided, where is green leafy hedge at lower left located with respect to green leafy bush at upper right? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/05d8aaf15ffd2078.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow fabric cap at center in front of blue striped shirt at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is in front of blue striped shirt at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc0f6d6056075680.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the burnt wood tree at center? Choose from: (A) green spiky plant at center (B) green spiky plant at left (C) charcoal-textured dirt field at center (D) bare wood tree at upper right" }, { "from": "gpt", "value": "(D) bare wood tree at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a41790a826ed5666.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of stone clock tower at center and metallic gray clock at center in the image provided, where is stone clock tower at center located with respect to metallic gray clock at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/43a2d80333dd0a8d.jpg", "conversations": [ { "from": "human", "value": "\nIs clear glassy water at center wider than white sand beach at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of clear glassy water at center exceeds that of white sand beach at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23e085cb5eb0d080.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.310, 0.375) (B) (0.956, 0.259)" }, { "from": "gpt", "value": "(A) (0.310, 0.375)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/947847f3e06c4aac.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) dark green trees at center (B) pink translucent clouds at upper center (C) smooth water at center" }, { "from": "gpt", "value": "(B) pink translucent clouds at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b440dedfa6cba28.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white wood shutter at left is positioned to the left of white wooden shutter at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, white wood shutter at left is to the left of white wooden shutter at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a3547df2e3930ab7.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass at lower left thinner than green matte shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a51af861511addd.jpg", "conversations": [ { "from": "human", "value": "\nDoes green painted wood at left appear under white painted wood at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f2cf8ae4e266b5a5.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) white wooden bridge at center (B) clear water at lower center" }, { "from": "gpt", "value": "(A) white wooden bridge at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46ca15942caa0113.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.958, 0.345) (B) (0.545, 0.058) (C) (0.368, 0.480)" }, { "from": "gpt", "value": "(C) (0.368, 0.480)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4ca69d0d3f4f4652.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the smooth wood stairs at lower left? Choose among these: (A) wooden deck at center (B) matte wood log cabin at center" }, { "from": "gpt", "value": "(A) wooden deck at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c379e06f2101ee67.jpg", "conversations": [ { "from": "human", "value": "\nDoes white paper schedule at center have a lesser width compared to yellow paper-like labor day weekend poster at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white paper schedule at center's width is not less than yellow paper-like labor day weekend poster at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a9610a0ff4185b06.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.665, 0.530) (B) (0.191, 0.614)" }, { "from": "gpt", "value": "(A) (0.665, 0.530)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a87d7d1ec01a4063.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) light blue shirt at left (B) matte blue shirt at center (C) gray cotton polo shirt at center (D) white shirt at center" }, { "from": "gpt", "value": "(D) white shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed4d3c37d01e8c11.jpg", "conversations": [ { "from": "human", "value": "\nIs matte blue t-shirt with dog print at center thinner than wooden bookshelf at right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, matte blue t-shirt with dog print at center is not thinner than wooden bookshelf at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06641e34ca8e375a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte paper map at left is wider than black matte jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/244ba9e00f937900.jpg", "conversations": [ { "from": "human", "value": "\nDoes silhouette horse at center have a lesser width compared to silhouette horse at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, silhouette horse at center's width is less than silhouette horse at left's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c4ed6786be324fc.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of black matte shirt at center in relation to brown leather glove at right? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c6c4f629111409aa.jpg", "conversations": [ { "from": "human", "value": "\nDoes red matte shirt at center have a lesser width compared to light brown hair at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, red matte shirt at center's width is not less than light brown hair at lower center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a768b7edcdf59a75.jpg", "conversations": [ { "from": "human", "value": "\nIs dark blue down jacket at center positioned at the back of teal fleece jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b89c58e5750f4c4f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.388, 0.237) (B) (0.782, 0.467) (C) (0.644, 0.706) (D) (0.005, 0.252)" }, { "from": "gpt", "value": "(B) (0.782, 0.467)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e45859c530e71cbc.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if smooth blonde hair at center is thinner than pink matte lips at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, smooth blonde hair at center is not thinner than pink matte lips at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a33a3ef96f845ebf.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) silver metallic laptop at center (B) gray concrete at center" }, { "from": "gpt", "value": "(B) gray concrete at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b774d5f3f56cd05.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if floral fabric blouse at center is wider than striped cotton shirt at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, the width of floral fabric blouse at center exceeds that of striped cotton shirt at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c86a8413ddd6dc6.jpg", "conversations": [ { "from": "human", "value": "\nWhere is black synthetic jacket at center located in relation to dark green puffy jacket at right in the image? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/073a6c3279bfc868.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of gray-white fur dog at center less distant than that of white and black fur at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb1782e6fa023ccb.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.833, 0.972) (B) (0.831, 0.653) (C) (0.118, 0.994) (D) (0.398, 0.891)" }, { "from": "gpt", "value": "(C) (0.118, 0.994)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0242e93f0164f31c.jpg", "conversations": [ { "from": "human", "value": "\nIs frosted brown tree at upper left behind smooth concrete pillars at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3a43a639fc14bdb9.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the green mossy rock at center? (A) green water at upper center (B) white porous rock at left" }, { "from": "gpt", "value": "(B) white porous rock at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d60433aec6e0a41c.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the brown wooden pole at upper center? (A) smooth gray rock at center (B) brown wooden rail at lower left" }, { "from": "gpt", "value": "(A) smooth gray rock at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/48d0da75d2384b01.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.509, 0.739) (B) (0.147, 0.717) (C) (0.441, 0.811) (D) (0.256, 0.277)" }, { "from": "gpt", "value": "(C) (0.441, 0.811)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8de7ac3f7b5df00.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) matte black suit at center (B) clear acrylic table at center (C) white glossy exhaust hood at upper center" }, { "from": "gpt", "value": "(B) clear acrylic table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7fcda482711d199a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white marble statue at center is bigger than white marble cherub at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, white marble statue at center is larger in size than white marble cherub at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4cd35a9395e9668a.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of shiny silver necklace at upper right in relation to white lace blouse at center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5bef1521432076dc.jpg", "conversations": [ { "from": "human", "value": "\nDoes snow-covered tree at center have a smaller size compared to white matte bench at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, snow-covered tree at center is not smaller than white matte bench at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/763eeb8c29f81fb4.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.144, 0.759) (B) (0.604, 0.786)" }, { "from": "gpt", "value": "(B) (0.604, 0.786)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29941f0ba1e725b6.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.227, 0.519) (B) (0.898, 0.380)" }, { "from": "gpt", "value": "(A) (0.227, 0.519)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3fc945f67ee93ba8.jpg", "conversations": [ { "from": "human", "value": "\nDoes wooden table at center appear over pink fleece jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c09ec16588f2d12a.jpg", "conversations": [ { "from": "human", "value": "\nIs blue smooth water at center bigger than metallic gray bridge at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, blue smooth water at center is not bigger than metallic gray bridge at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e57b45b274c05f6c.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is gray rock waterfall at center located relative to matte pink flower at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1ff5099ec81c311.jpg", "conversations": [ { "from": "human", "value": "\nIs thatched straw hut at center wider than woven wood fence at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b85e31f6471b4696.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy branches at upper left thinner than green leafy tree at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c134900b14ea92f.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of gray cotton shorts at right in reference to wooden sign at upper right? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c861b68f99aea31d.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) black fuzzy paw at lower right (B) black fur paw at lower left (C) black fleece dog bed at center" }, { "from": "gpt", "value": "(B) black fur paw at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a530c46821a39630.jpg", "conversations": [ { "from": "human", "value": "\nIs clear water at center positioned before white cotton shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is in front of white cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e25ec5e2ba8004b.jpg", "conversations": [ { "from": "human", "value": "\nDoes plaid cotton shirt at center have a greater width compared to superman t-shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, plaid cotton shirt at center might be narrower than superman t-shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/008e3a8fdca8dd20.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) white matte boat at center (B) dark brown fleece at center (C) camouflage jacket at left" }, { "from": "gpt", "value": "(A) white matte boat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc861fe331f459e3.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the light blue fabric dress at center? Choose among these: (A) light blue fabric at center (B) matte white shirt at center (C) pale skin hand at center" }, { "from": "gpt", "value": "(A) light blue fabric at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d51cd0e2920bff86.jpg", "conversations": [ { "from": "human", "value": "\nIs dusty gravel path at center wider than matte black backpack at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ae71aed992aafc48.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.440, 0.673) (B) (0.566, 0.886)" }, { "from": "gpt", "value": "(B) (0.566, 0.886)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/422278a2556ea640.jpg", "conversations": [ { "from": "human", "value": "\nIs green matte leaf at center to the right of green textured frog at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, green matte leaf at center is to the left of green textured frog at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/83c58694816beb31.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) green mossy bark tree at left (B) silver metallic railing at center (C) green leafy tree at center (D) metallic staircase at center" }, { "from": "gpt", "value": "(B) silver metallic railing at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8172e39fdb09c5a0.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) shiny brown horse at center (B) brown sandy dirt at center, is positioned farthest from the floral-patterned fabric at center?" }, { "from": "gpt", "value": "(B) brown sandy dirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b77c665ad6421ce.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at center is positioned above green matte tree at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, green leafy tree at center is located above green matte tree at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d29d75a8895a3598.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at lower left wider than metallic silver streetlight at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b2b242da33cbe88c.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the matte black tank top at center? Choose from: (A) purple soft lavender at lower center (B) smooth skin head at center" }, { "from": "gpt", "value": "(A) purple soft lavender at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/735734abb7200606.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black/yellow fabric tent at center is positioned to the left of yellow t-shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, black/yellow fabric tent at center is to the right of yellow t-shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70299bb89f5c98b0.jpg", "conversations": [ { "from": "human", "value": "\nIs white fluffy cloud at upper center smaller than brown dry grass at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ab97652ded0ea8e.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of brown brick pavement at center and teak wood chair at center in the image provided, where is brown brick pavement at center located with respect to teak wood chair at center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/610cdb9ab4254a20.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black skateboard at center appear under black worn skateboard at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, matte black skateboard at center is above black worn skateboard at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/781fee4d3bd4341c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if coarse rope net at center is positioned to the right of transparent water at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, coarse rope net at center is not to the right of transparent water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5bc2087a05cb0fc5.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) matte black jacket at left (B) black matte jacket at left (C) yellow matte jacket at center" }, { "from": "gpt", "value": "(C) yellow matte jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04c4d69476d77def.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) smooth skin face at center (B) blonde curly hair at upper left" }, { "from": "gpt", "value": "(A) smooth skin face at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2cc698dbd9126475.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue denim jeans at lower right is bigger than green leafy plant at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/763644ec63f85bba.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of green needle-like tree at left and green textured pine at center in the image provided, where is green needle-like tree at left located with respect to green textured pine at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d5a23219a1a190f9.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte shirt at center smaller than dark purple shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white matte shirt at center is not smaller in size than dark purple shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bed5e0aa318ae70c.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark brown leather jacket at lower center come behind red jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is in front of red jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0b0e635f131f645.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white smooth monument at center is positioned above white matte cross at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, white smooth monument at center is not above white matte cross at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f098ceaa143061c7.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark gray jacket at right lie in front of blue fleece jacket at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37e954622f002f63.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.671, 0.511) (B) (0.379, 0.766) (C) (0.672, 0.586)" }, { "from": "gpt", "value": "(B) (0.379, 0.766)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/19020eec2acf61c3.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) matte plastic bulletin at center (B) matte silver bulletin at center (C) blue paper poster at center" }, { "from": "gpt", "value": "(A) matte plastic bulletin at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d63a00686866d553.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the green textured tree at upper center from the following options: (A) green glossy tree at upper left (B) green leafy tree at left?" }, { "from": "gpt", "value": "(A) green glossy tree at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06f5677342a6cbb5.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) white textured cardigan at center (B) gray fleece sweater at left (C) pink matte sweater at center" }, { "from": "gpt", "value": "(C) pink matte sweater at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/df62e5a49897a5bb.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at left above green grass at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green leafy tree at left is positioned over green grass at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9998cbe807f17c96.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.606, 0.673) (B) (0.853, 0.617)" }, { "from": "gpt", "value": "(A) (0.606, 0.673)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29db5dcf235b6f0c.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte blue train at center appear on the left side of black gravel at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte blue train at center is to the left of black gravel at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8794b94ebe53ee00.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.533, 0.577) (B) (0.487, 0.423)" }, { "from": "gpt", "value": "(B) (0.487, 0.423)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f0ba762b9eb48f4f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.731, 0.845) (B) (0.299, 0.834)" }, { "from": "gpt", "value": "(B) (0.299, 0.834)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b3f5b615a7102ccb.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) white matte boat at center (B) blue water at dock center" }, { "from": "gpt", "value": "(A) white matte boat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c6a0a89398fb5fa4.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) transparent glass at center (B) white plastic license plate at center" }, { "from": "gpt", "value": "(A) transparent glass at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a0260d53590d052.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green grass at center is bigger than green textured pine tree at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green grass at center has a larger size compared to green textured pine tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/263c15a5904110a7.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) plaid fabric crop top at center (B) plaid fabric shirt at center (C) denim shorts at center" }, { "from": "gpt", "value": "(A) plaid fabric crop top at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/902c828e961d486b.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte gray blouse at upper left have a smaller size compared to metallic silver microphone at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, matte gray blouse at upper left might be larger than metallic silver microphone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6fc8a7a79ff9ebac.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) black fleece jacket at center (B) gray fleece sweatshirt at center" }, { "from": "gpt", "value": "(A) black fleece jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e14720b740dbdf8c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) dark gray stone clock at center (B) stone steeple at left" }, { "from": "gpt", "value": "(A) dark gray stone clock at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86061c0ccd5d9f98.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown matte jacket at center have a smaller size compared to light blue fabric at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7465bf52ca16d4b.jpg", "conversations": [ { "from": "human", "value": "\nDoes vibrant floral dress at center have a greater width compared to black jersey dress at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, the width of vibrant floral dress at center exceeds that of black jersey dress at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d984533dabbd84a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if weathered wood bench at center is positioned above weathered wood log at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, weathered wood bench at center is located above weathered wood log at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9db578cff707f21.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is gray stone pedestal at center located relative to polished bronze statue at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7773a0ee3924dba5.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) porcelain tea pot at center (B) porcelain vase with floral design at left" }, { "from": "gpt", "value": "(B) porcelain vase with floral design at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/90f2fc441f7a06a8.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue cotton t-shirt at center is wider than gray cotton t-shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of blue cotton t-shirt at center exceeds that of gray cotton t-shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d9164bddbee2b6e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if metallic gold chair at right is positioned below wooden violin at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aca6a30e6b1b0546.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the shiny black sedan at center right? (A) shiny black sedan at lower left (B) silver metallic van at lower left" }, { "from": "gpt", "value": "(B) silver metallic van at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d878a3899a93158.jpg", "conversations": [ { "from": "human", "value": "\nIs transparent plastic hand at center above white clay at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, transparent plastic hand at center is positioned over white clay at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c69b365b84f1c70a.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at upper left lie in front of brown wooden sign at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, green leafy tree at upper left is behind brown wooden sign at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3884d07e18f9beca.jpg", "conversations": [ { "from": "human", "value": "\nDoes thatched roof hut at upper center lie in front of thatched roof shelter at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, thatched roof hut at upper center is behind thatched roof shelter at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c611d21db4748985.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black shirt at center is positioned to the right of brown feathered bird at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, matte black shirt at center is to the left of brown feathered bird at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cad7d70e54f4d0aa.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.268, 0.281) (B) (0.189, 0.670)" }, { "from": "gpt", "value": "(B) (0.189, 0.670)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f96162bb2d1e5415.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the matte wooden nesting doll at center? (A) white matte mouse at lower left (B) yellow matte glue stick at center" }, { "from": "gpt", "value": "(A) white matte mouse at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d34bf0826d1b04a7.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.669, 0.830) (B) (0.019, 0.100) (C) (0.907, 0.472) (D) (0.972, 0.394)" }, { "from": "gpt", "value": "(A) (0.669, 0.830)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e931e4ae8a0641c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.130, 0.983) (B) (0.737, 0.633)" }, { "from": "gpt", "value": "(B) (0.737, 0.633)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/485fb3ac15421384.jpg", "conversations": [ { "from": "human", "value": "\nDoes brushed metal knife at lower left have a greater width compared to smooth brown rock at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, brushed metal knife at lower left is wider than smooth brown rock at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6542d09fdb8cfeaf.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray stone statue at center have a larger size compared to granite statue at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e000057831071917.jpg", "conversations": [ { "from": "human", "value": "\nIs rough stone boulder at center above orange safety vest at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, rough stone boulder at center is located above orange safety vest at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f6b7b0b766c5ec92.jpg", "conversations": [ { "from": "human", "value": "\nDoes white painted wood pole at center appear under white painted pole at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, white painted wood pole at center is not positioned below white painted pole at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3e50f72213187ec4.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.528, 0.428) (B) (0.181, 0.561)" }, { "from": "gpt", "value": "(A) (0.528, 0.428)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fc8ef7d8b735387f.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) maroon plush vest at center (B) denim jacket at left" }, { "from": "gpt", "value": "(A) maroon plush vest at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/596c70657f4fd9ba.jpg", "conversations": [ { "from": "human", "value": "\nIs blue suit at center thinner than bald head at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, blue suit at center might be wider than bald head at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd644ef7661fcd94.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.576, 0.628) (B) (0.634, 0.698) (C) (0.509, 0.633)" }, { "from": "gpt", "value": "(C) (0.509, 0.633)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/131389c84cf0abec.jpg", "conversations": [ { "from": "human", "value": "\nIs gray fabric shirt at upper right positioned at the back of black matte jacket at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, gray fabric shirt at upper right is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7500733141885d12.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of green textured tree at center and green leafy tree at left in the image provided, where is green textured tree at center located with respect to green leafy tree at left? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2bbcd56348a3374c.jpg", "conversations": [ { "from": "human", "value": "\nIs matte white projector screen at center to the right of black matte laptop at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte white projector screen at center is to the right of black matte laptop at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9a44607fe593c61c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the matte blue polo shirt at center? Select from: (A) blue button-up shirt at center (B) purple striped polo shirt at center" }, { "from": "gpt", "value": "(B) purple striped polo shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77980dbae006cd7a.jpg", "conversations": [ { "from": "human", "value": "\nDoes metallic glass bell tower at center appear on the left side of smooth concrete dock at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, metallic glass bell tower at center is to the left of smooth concrete dock at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1016ede674a031e.jpg", "conversations": [ { "from": "human", "value": "\nIs rubber ball pit at center bigger than blue matte shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, rubber ball pit at center is larger in size than blue matte shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f830f82c15c4654f.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the green leafy tree at right? Choose from: (A) pink fabric flower at left (B) green smooth lawn at center (C) green leafy tree at center" }, { "from": "gpt", "value": "(C) green leafy tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/218b2fddb16b8df0.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) green leafy tree at lower left (B) dark gray concrete building at left (C) brown stone building at center (D) green leafy tree at upper right" }, { "from": "gpt", "value": "(C) brown stone building at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d2cb7d49a09c4c6.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.435, 0.480) (B) (0.015, 0.536)" }, { "from": "gpt", "value": "(A) (0.435, 0.480)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c8825304621c6ec.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray cotton t-shirt at center have a lesser width compared to black pinstripe suit at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, gray cotton t-shirt at center's width is not less than black pinstripe suit at left's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d850210379410db0.jpg", "conversations": [ { "from": "human", "value": "\nDoes leopard print pants at right have a greater width compared to leopard print suitcase at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, leopard print pants at right has a greater width compared to leopard print suitcase at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a5631b787004838.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if yellow matte church at center is bigger than golden spire at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, yellow matte church at center is not larger than golden spire at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff34c2766b572e59.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if translucent glass at center is wider than blue plaid shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/84d7d9c96712f376.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) light blue cotton shirt at left (B) white cotton shirt at right" }, { "from": "gpt", "value": "(B) white cotton shirt at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/322f56cec9803a3b.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) black rubber goggles at center (B) red and white plastic sunglasses at center (C) reflective plastic sunglasses at center (D) white mesh fence at center" }, { "from": "gpt", "value": "(D) white mesh fence at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04e61a16167112a7.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.580, 0.044) (B) (0.628, 0.098) (C) (0.735, 0.372)" }, { "from": "gpt", "value": "(B) (0.628, 0.098)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5fc18a766d91d6f2.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.892, 0.953) (B) (0.655, 0.150) (C) (0.950, 0.519)" }, { "from": "gpt", "value": "(A) (0.892, 0.953)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/004ac8c6da80cd56.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) matte black blazer at center (B) white shirt with tie at upper right (C) white smooth table at center" }, { "from": "gpt", "value": "(C) white smooth table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/14e6d36b96aa37f0.jpg", "conversations": [ { "from": "human", "value": "\nIs red jacket at center further to camera compared to black shirt at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, red jacket at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a738e679fe46eb99.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.417, 0.312) (B) (0.970, 0.544) (C) (0.756, 0.878)" }, { "from": "gpt", "value": "(C) (0.756, 0.878)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/10ad51bfa36bcb2d.jpg", "conversations": [ { "from": "human", "value": "\nDoes pink paisley fabric top at upper right have a greater width compared to black smooth hair at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, the width of pink paisley fabric top at upper right exceeds that of black smooth hair at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d709a96b0d4d8ee6.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) floral cotton dress at center (B) green cotton shirt at center (C) white sandcastle at center" }, { "from": "gpt", "value": "(A) floral cotton dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/64e72152e2c03fad.jpg", "conversations": [ { "from": "human", "value": "\nIs clear water at center further to camera compared to green matte tree at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is in front of green matte tree at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ad4adbf00e91189.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.135, 0.511) (B) (0.499, 0.950) (C) (0.660, 0.822) (D) (0.909, 0.575)" }, { "from": "gpt", "value": "(A) (0.135, 0.511)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9301564f95715fe5.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.828, 0.222) (B) (0.655, 0.470)" }, { "from": "gpt", "value": "(A) (0.828, 0.222)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f53851f88739a3e.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) silver metallic rail at lower center (B) white fabric shirt at center, is positioned farthest from the blue fabric jacket at center?" }, { "from": "gpt", "value": "(A) silver metallic rail at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/725bb473d316eb0b.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden table at center above blue fleece sweatshirt at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, wooden table at center is not positioned above blue fleece sweatshirt at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/561fdda370485d54.jpg", "conversations": [ { "from": "human", "value": "\nIs metallic chrome rearview mirror at center smaller than asphalt road at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, metallic chrome rearview mirror at center occupies less space than asphalt road at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea3bb4151040820c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) white marble fountain at lower right (B) beige stone building at center" }, { "from": "gpt", "value": "(A) white marble fountain at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/af22d81e2cb87e48.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of bare branches at left and brown dirt track at left in the image provided, where is bare branches at left located with respect to brown dirt track at left? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f86be0f0a475eb09.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) white metallic ski at center (B) white snow at center" }, { "from": "gpt", "value": "(A) white metallic ski at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb493356805965c8.jpg", "conversations": [ { "from": "human", "value": "\nDoes transparent plastic balloon at upper left appear on the right side of matte black shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, transparent plastic balloon at upper left is not to the right of matte black shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a54624f495541b8.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the white soft fabric baby at center? (A) blue fabric jacket at center (B) printed fabric shawl at center" }, { "from": "gpt", "value": "(B) printed fabric shawl at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f0a71d141d280b6f.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden fence at left smaller than yellow plastic boat at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, wooden fence at left might be larger than yellow plastic boat at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf2e7fd5828ae13d.jpg", "conversations": [ { "from": "human", "value": "\nIs dark gray t-shirt at center below blue denim jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, dark gray t-shirt at center is positioned under blue denim jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8d54953d0932d35.jpg", "conversations": [ { "from": "human", "value": "\nIs green matte shirt at right further to camera compared to dark blue wetsuit at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f4bd14ff9d72f27.jpg", "conversations": [ { "from": "human", "value": "\nDoes wooden deck at right appear on the right side of rustic wood hut at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, wooden deck at right is to the right of rustic wood hut at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3fdbdb2a412df0f4.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the blue fabric life jacket at center? Choose from: (A) blue fabric life jacket at lower right (B) blue fabric life jacket at left" }, { "from": "gpt", "value": "(B) blue fabric life jacket at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f0c9744c5e0c029d.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) matte gray shirt at center (B) shaggy brown dog at center" }, { "from": "gpt", "value": "(A) matte gray shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bcdb538bf4dc5b75.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the black matte shorts at center? Select from: (A) matte black hair at upper center (B) smooth gray rock at center (C) matte black hand at upper center (D) black fabric shorts at center" }, { "from": "gpt", "value": "(C) matte black hand at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/719f43e8a40b6982.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) white glass building at center (B) brown glassy building at upper center" }, { "from": "gpt", "value": "(A) white glass building at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/452d469272d4b209.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) matte blue backpack at center (B) silver metallic pole at center" }, { "from": "gpt", "value": "(A) matte blue backpack at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0f6a3c803ba5fd8.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the plaid shirt at center? Choose among these: (A) white cotton t-shirt at left (B) denim jacket at center (C) smooth white t-shirt at center" }, { "from": "gpt", "value": "(B) denim jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77b4a5612cee3c13.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the wooden table at lower right? Choose from: (A) wooden photo frame at lower right (B) black plastic lamp at lower right" }, { "from": "gpt", "value": "(B) black plastic lamp at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0564ea0a5e97b2f3.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte brown fabric skull at center is bigger than white shirt at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, matte brown fabric skull at center is not larger than white shirt at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04b179624606c7bb.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at upper left is positioned below green leafy tree at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, green leafy tree at upper left is above green leafy tree at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c1134ccbfff7fe96.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white t-shirt at center is positioned to the right of matte black jacket at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, white t-shirt at center is positioned on the right side of matte black jacket at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8de0730e016a162c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if purple cotton shirt at right is wider than blonde hair at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, purple cotton shirt at right is wider than blonde hair at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fd7360e52294114c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.423, 0.139) (B) (0.365, 0.242) (C) (0.575, 0.263) (D) (0.800, 0.666)" }, { "from": "gpt", "value": "(D) (0.800, 0.666)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/43ff13fa64542219.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.653, 0.614) (B) (0.856, 0.938) (C) (0.168, 0.802) (D) (0.494, 0.545)" }, { "from": "gpt", "value": "(C) (0.168, 0.802)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/13f2fc5d64f003e9.jpg", "conversations": [ { "from": "human", "value": "\nDoes beige plastic atari 400 at center come behind beige plastic atari 410 at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46f1fa1e74b5ec53.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white matte window at center is bigger than blue fabric figure at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, white matte window at center is larger in size than blue fabric figure at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/41f6d110cb7d0e39.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) metallic red table at center (B) black plastic monitor at center" }, { "from": "gpt", "value": "(B) black plastic monitor at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b66c9a09d95b5468.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.404, 0.938) (B) (0.376, 0.780) (C) (0.804, 0.586)" }, { "from": "gpt", "value": "(C) (0.804, 0.586)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7e20795613d567d.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the bright yellow light at center? Choose among these: (A) bright yellow starburst at upper center (B) matte glass storefront at center" }, { "from": "gpt", "value": "(B) matte glass storefront at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2259baf80b08ec46.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.154, 0.966) (B) (0.466, 0.489) (C) (0.833, 0.766)" }, { "from": "gpt", "value": "(A) (0.154, 0.966)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f2d3a56278e28c87.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) plaid shirt at center (B) plaid cotton shirt at center" }, { "from": "gpt", "value": "(B) plaid cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c56bc8016f398ef.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) black glossy dog at left (B) shiny golden dog at center" }, { "from": "gpt", "value": "(A) black glossy dog at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/510e26218e24680b.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue water at center appear under green leafy trees at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, blue water at center is above green leafy trees at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e7a24e3e8d951832.jpg", "conversations": [ { "from": "human", "value": "\nIs white glass storefront at center smaller than matte glass mannequins at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, white glass storefront at center might be larger than matte glass mannequins at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3e9d0cdb2de12249.jpg", "conversations": [ { "from": "human", "value": "\nIs green textured mountain at upper right behind black fabric paddleboard at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/233287dffee0bde8.jpg", "conversations": [ { "from": "human", "value": "\nDoes green fabric bag at center have a lesser width compared to blue denim jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, green fabric bag at center's width is less than blue denim jacket at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/504aae64a715586b.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is white printed t-shirt at right located relative to light blue shirt at center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6862bdadb2f43a64.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) matte red shirt at right (B) translucent glass at left, is positioned farthest from the orange knitted sweater at center?" }, { "from": "gpt", "value": "(B) translucent glass at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ddf0c51571f57e44.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) white shirt at center (B) pink silk tie at center (C) black pinstripe suit at center" }, { "from": "gpt", "value": "(C) black pinstripe suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/68e75a4590e586e3.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.432, 0.477) (B) (0.513, 0.730) (C) (0.312, 0.497) (D) (0.202, 0.480)" }, { "from": "gpt", "value": "(D) (0.202, 0.480)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d9701aace228d96.jpg", "conversations": [ { "from": "human", "value": "\nIs silhouette metal bicycle at center above smooth metal bicycle wheel at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, silhouette metal bicycle at center is located above smooth metal bicycle wheel at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1b1624e76936951c.jpg", "conversations": [ { "from": "human", "value": "\nIs smooth bark tree at right positioned before metallic silver car at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b89b3e0815b072af.jpg", "conversations": [ { "from": "human", "value": "\nDoes lime green fabric bean bag at lower left have a lesser width compared to green fabric bean bag at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, lime green fabric bean bag at lower left's width is not less than green fabric bean bag at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/75c1a68c78bfec8e.jpg", "conversations": [ { "from": "human", "value": "\nIs light green sheer dress at center in front of velvet gold dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c201b93d52e1278.jpg", "conversations": [ { "from": "human", "value": "\nIs satin blue car at center wider than shiny red car at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, satin blue car at center has a greater width compared to shiny red car at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7cd57c483e0121b6.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte toothbrush at center have a greater width compared to yellow fabric lanyard at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a63bb1e58311cab.jpg", "conversations": [ { "from": "human", "value": "\nDoes teal matte shirt at center have a smaller size compared to striped sweater at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, teal matte shirt at center occupies less space than striped sweater at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b59e6629c556369.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the dark gray scarf at right? Choose among these: (A) dark brown hair at lower center (B) dark blue jacket at center (C) green matte sweater at upper left" }, { "from": "gpt", "value": "(A) dark brown hair at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4c4d59e439049697.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.246, 0.023) (B) (0.542, 0.497)" }, { "from": "gpt", "value": "(B) (0.542, 0.497)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0b51806eca98646.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) red silk tie at center (B) dark gray smooth hand at center" }, { "from": "gpt", "value": "(B) dark gray smooth hand at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b3fa9ba267b5abe.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the green painted wood boat at upper right? Select from: (A) matte black swan at center (B) matte black swan at upper left" }, { "from": "gpt", "value": "(B) matte black swan at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fe08de435fe0fb9a.jpg", "conversations": [ { "from": "human", "value": "\nIs gray fabric at center further to the viewer compared to gray fabric headscarf at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is in front of gray fabric headscarf at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fee921653c665ee8.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.511, 0.459) (B) (0.701, 0.597) (C) (0.246, 0.747)" }, { "from": "gpt", "value": "(C) (0.246, 0.747)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5447a63be1a51660.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of wooden window at center in reference to green matte door at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f1b7b339a554756.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.792, 0.716) (B) (0.360, 0.053) (C) (0.280, 0.542)" }, { "from": "gpt", "value": "(B) (0.360, 0.053)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b9bedc8856a76253.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.341, 0.567) (B) (0.367, 0.686) (C) (0.683, 0.470)" }, { "from": "gpt", "value": "(C) (0.683, 0.470)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/abf80f2d0372a804.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.113, 0.864) (B) (0.294, 0.602)" }, { "from": "gpt", "value": "(A) (0.113, 0.864)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d270f46c74a745f6.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) blue jacket at left (B) black fleece jacket at center" }, { "from": "gpt", "value": "(A) blue jacket at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8d73135be7999c70.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the blue striped shirt at upper right? Choose among these: (A) dark blue striped shirt at lower center (B) matte gray shirt at left" }, { "from": "gpt", "value": "(B) matte gray shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7bd677e58dd92fb0.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.297, 0.894) (B) (0.690, 0.327)" }, { "from": "gpt", "value": "(A) (0.297, 0.894)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8bddc870ef9a433.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the brown matte pretzel at center? Choose among these: (A) brown matte snack at center (B) matte plastic snack tray at center" }, { "from": "gpt", "value": "(A) brown matte snack at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9e103e097c6eb744.jpg", "conversations": [ { "from": "human", "value": "\nIs blue rubber water bottle at center thinner than clear plastic bottle at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e23023ad2f1175e3.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if camouflage jacket at left is positioned to the left of camouflage jacket at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, camouflage jacket at left is positioned on the left side of camouflage jacket at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6011e6c1134d0a35.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green grass at center located in relation to brown rough stone at center in the image? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5978086751cf7eb2.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.358, 0.678) (B) (0.382, 0.616) (C) (0.989, 0.480)" }, { "from": "gpt", "value": "(C) (0.989, 0.480)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cde169434930f92d.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of yellow sleeveless shirt at left in reference to red and blue cotton shirt at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/65bdff2294241bf9.jpg", "conversations": [ { "from": "human", "value": "\nDoes orange matte motorcycle at center have a lesser width compared to black matte motorcycle at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, orange matte motorcycle at center's width is not less than black matte motorcycle at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f89b2864a506a00d.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the matte black sunglasses at center? Choose from: (A) matte black shirt at center (B) red synthetic jacket at center (C) denim jeans at center" }, { "from": "gpt", "value": "(B) red synthetic jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3bda5df5e114ae26.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) red matte flower pot at center (B) bright red flowers at center" }, { "from": "gpt", "value": "(B) bright red flowers at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a6814bc0742845a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) brown sandy dirt field at center (B) white smooth tree trunk at left" }, { "from": "gpt", "value": "(B) white smooth tree trunk at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/248daf16bb6bef2b.jpg", "conversations": [ { "from": "human", "value": "\nIs brown matte robe at center to the left of green leafy palm tree at upper right from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find brown matte robe at center to the left of green leafy palm tree at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7714cdeda859ce1a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black wool suit at right is positioned to the right of black matte dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, black wool suit at right is positioned on the right side of black matte dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/89c9a2bda3c0f53d.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown striped sweater at center appear under pink striped sweater at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, brown striped sweater at center is above pink striped sweater at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e23790a6f2e9850.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) spotted fur fawn at lower right (B) brown gravel path at center" }, { "from": "gpt", "value": "(B) brown gravel path at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/66fb2057ed751e9c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) light blue fabric at center (B) light gray cotton sweater at center (C) blue fabric basket at center" }, { "from": "gpt", "value": "(C) blue fabric basket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/153c4b174469f63d.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.560, 0.367) (B) (0.316, 0.544)" }, { "from": "gpt", "value": "(B) (0.316, 0.544)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6473fe8d10060823.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is golden leaves at upper right located relative to light gray stone bell tower at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1fb5a1573ffef946.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is white paper sign at center located relative to matte black sunglasses at lower left? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/74aa07bd72d4e551.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.477, 0.592) (B) (0.780, 0.728)" }, { "from": "gpt", "value": "(B) (0.780, 0.728)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58ff38f217876594.jpg", "conversations": [ { "from": "human", "value": "\nIs white dotted scarf at lower left smaller than matte black head at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white dotted scarf at lower left is not smaller than matte black head at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/822fd35e44f1d1e2.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue matte board at upper right lie in front of white plastic table at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/176faac080bef0b7.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) smooth plastic seat at center (B) smooth gray rock at lower center (C) shiny red kayak at lower center (D) clear water at center" }, { "from": "gpt", "value": "(B) smooth gray rock at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/43cc17199c369bf8.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.639, 0.716) (B) (0.040, 0.578)" }, { "from": "gpt", "value": "(B) (0.040, 0.578)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7b79617f04172691.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) green led scoreboard at upper center (B) white leather jacket at left" }, { "from": "gpt", "value": "(A) green led scoreboard at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/20fc500e2351fb89.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) dark wood dock at lower center (B) wooden boat at left (C) metallic silver boat at lower right (D) glistening water at center" }, { "from": "gpt", "value": "(B) wooden boat at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5f46e6a7e066d246.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the dark brown leather jacket at left? Choose from: (A) white fabric flag at center (B) gold metallic trike at left (C) white fabric flag at upper left (D) polished chrome trike at center" }, { "from": "gpt", "value": "(C) white fabric flag at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/97254c17b0a76f97.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) brown and white fur dog at center (B) white metal bench at center" }, { "from": "gpt", "value": "(A) brown and white fur dog at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cbef3bbaeb765847.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the wooden rail at center? Select from: (A) wooden bridge at center (B) beige sandy beach at center" }, { "from": "gpt", "value": "(B) beige sandy beach at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/127ec23465fa91fc.jpg", "conversations": [ { "from": "human", "value": "\nDoes shiny brown crocodile at center have a greater width compared to white plastic fishing pole at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1232c1ae0f8fe836.jpg", "conversations": [ { "from": "human", "value": "\nIs pink floral dress at center thinner than matte red shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc8e9ad9d3d6e4a4.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.374, 0.689) (B) (0.389, 0.373) (C) (0.866, 0.522)" }, { "from": "gpt", "value": "(A) (0.374, 0.689)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1df8d632bf4a2fd.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.498, 0.581) (B) (0.605, 0.061)" }, { "from": "gpt", "value": "(A) (0.498, 0.581)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/35462c12af997c4c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) dark blue shirt at right (B) light gray jacket at center (C) matte black speaker at left (D) metallic silver speaker at upper right" }, { "from": "gpt", "value": "(A) dark blue shirt at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e99f3410f35fd9e3.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the leather boots at lower center? Choose among these: (A) brown suede boot at lower center (B) white-spotted fur dog at right" }, { "from": "gpt", "value": "(A) brown suede boot at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01cfe6a5503e0120.jpg", "conversations": [ { "from": "human", "value": "\nIs transparent water at center bigger than green leafy trees at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, transparent water at center is not larger than green leafy trees at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3473ad8fe2218a99.jpg", "conversations": [ { "from": "human", "value": "\nWhere is white powdery snow at lower center located in relation to brick building at center in the image? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f4feeb36b4d5b40.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) matte brown hand at lower left (B) matte brown statue at center" }, { "from": "gpt", "value": "(B) matte brown statue at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03521e09321cf595.jpg", "conversations": [ { "from": "human", "value": "\nDoes smooth wood table at center appear on the left side of black matte desk lamp at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, smooth wood table at center is to the left of black matte desk lamp at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a0225db1401b775a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at upper left is thinner than green leafy tree at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, green leafy tree at upper left might be wider than green leafy tree at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/27743e87173c33a5.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the white matte hand at lower center from the following options: (A) smooth white hand at center (B) white plastic cup at center?" }, { "from": "gpt", "value": "(B) white plastic cup at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/24211e4d64396d50.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the red/white striped pole at center? Choose among these: (A) white plastic license plate at center (B) matte blue car at left (C) metallic silver pole at center" }, { "from": "gpt", "value": "(A) white plastic license plate at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2ac60621ec11d85.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the pink cotton shirt at center? Select from: (A) brown textured suit at center (B) houndstooth fabric jacket at left" }, { "from": "gpt", "value": "(A) brown textured suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d33f737993af31f6.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte sneaker at lower center thinner than white rubber shoe at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, white matte sneaker at lower center's width is not less than white rubber shoe at lower center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ecebc33a428a44a.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at center have a larger size compared to bare branches at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, green leafy tree at center is not larger than bare branches at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca8fc2b6bc29e744.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte jacket at center below white fabric helmet at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/03a0dee6a3c5a2f6.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown wooden train track at lower right appear under white glossy train at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, brown wooden train track at lower right is positioned under white glossy train at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e01991096c60fdd.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) teal metallic car at center (B) white matte t-shirt at center (C) matte black car trunk at left, is positioned farthest from the brown fabric tent at center?" }, { "from": "gpt", "value": "(A) teal metallic car at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5ce9debc190542aa.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) gray fabric tank top at center (B) brown leather belt at lower center (C) white fabric dress at upper right (D) matte white toga at upper right" }, { "from": "gpt", "value": "(A) gray fabric tank top at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d01425e103774868.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the blue metallic car at left? Select from: (A) yellow reflective jacket at center (B) metallic blue sedan at left" }, { "from": "gpt", "value": "(B) metallic blue sedan at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca41446b7c911053.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.679, 0.497) (B) (0.867, 0.192)" }, { "from": "gpt", "value": "(A) (0.679, 0.497)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4fcdf0318103218c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if beige suit at center is wider than dark gray suit at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, beige suit at center is wider than dark gray suit at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c3d641274037988a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue water at center is smaller than green leafy tree at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, blue water at center is smaller than green leafy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/99340bc66fabe25a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.497, 0.908) (B) (0.936, 0.767)" }, { "from": "gpt", "value": "(A) (0.497, 0.908)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5eb4085f1cfe7554.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue tarpaulin canopy at upper center appear on the left side of matte black chairs at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, blue tarpaulin canopy at upper center is to the left of matte black chairs at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/61a71bd8eb4c8dd9.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of glistening water at center in reference to black straw umbrella at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29249d4fdbc61056.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.721, 0.945) (B) (0.263, 0.791)" }, { "from": "gpt", "value": "(B) (0.263, 0.791)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c20568aa02bdb91e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark reflective water at center is positioned to the left of white matte sailboat at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, dark reflective water at center is not on the left side of white matte sailboat at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d4cbfae801a54f5b.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) clear water at boat right (B) wooden sailboat at center" }, { "from": "gpt", "value": "(A) clear water at boat right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9e0b36ba67bed822.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the matte floral shoe at center among (A) floral fabric shoe at center (B) matte floral shoe at upper center?" }, { "from": "gpt", "value": "(B) matte floral shoe at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3740908f1206d243.jpg", "conversations": [ { "from": "human", "value": "\nWhere is white frothy wave at center located in relation to blue fabric shirt at center in the image? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba9dbc4fb4153ff6.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) brown wooden chair at lower center (B) dark brown wood bookcase at left" }, { "from": "gpt", "value": "(A) brown wooden chair at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dbc610e6a0b4c462.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) matte red robe at center (B) matte red toga at center (C) smooth asphalt pavement at lower center" }, { "from": "gpt", "value": "(C) smooth asphalt pavement at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/200d1bb5d7cd9d78.jpg", "conversations": [ { "from": "human", "value": "\nIs matte brown leggings at center above brown smooth leggings at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e427c97675a17869.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the dark green foliage at left? Choose among these: (A) dark grass at center (B) brown textured tree at right (C) silhouette bare trees at center (D) bare branches at upper right" }, { "from": "gpt", "value": "(B) brown textured tree at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/28b978351e2c0ead.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of matte red lantern at left more distant than that of matte red lantern at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte red lantern at left is further from the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3ac34b0b2887caf5.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny plastic apple at left behind matte black laptop at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, shiny plastic apple at left is in front of matte black laptop at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e9362f3f7386093c.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown rough bark tree at left appear on the right side of camouflage uniform at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, brown rough bark tree at left is to the left of camouflage uniform at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cda7ae3782eeb070.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of green leafy tree at left in relation to smooth gray rock at upper center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e729504f08654f10.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if wooden table at center is positioned below golden cracker at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e459c834b48d86a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white wrought iron balcony at center is positioned to the left of silver shiny trumpet at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find white wrought iron balcony at center to the left of silver shiny trumpet at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e448125517a58148.jpg", "conversations": [ { "from": "human", "value": "\nIs white floral dress at center wider than black plastic sunglasses at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3acad5873e7d5507.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if wooden frame at upper center is positioned to the left of matte yellow armchair at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find wooden frame at upper center to the left of matte yellow armchair at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3187f4cab29e1aed.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) brushed metal towel bar at upper left (B) white glossy bathtub at lower left (C) white glossy toilet at lower right" }, { "from": "gpt", "value": "(C) white glossy toilet at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a0201a794da3fff.jpg", "conversations": [ { "from": "human", "value": "\nIs blue denim jeans at center bigger than striped cotton shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, blue denim jeans at center is larger in size than striped cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6c22002cfa8777b9.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) light gray fleece jacket at left (B) matte black coat at center (C) metallic silver train at center" }, { "from": "gpt", "value": "(A) light gray fleece jacket at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3df4b5c6ec0af055.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.027, 0.270) (B) (0.925, 0.284) (C) (0.454, 0.466) (D) (0.675, 0.266)" }, { "from": "gpt", "value": "(C) (0.454, 0.466)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/15d69d6e8358f821.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the dark blue shirt at center? (A) dark gray sweater at lower left (B) striped polo shirt at lower right (C) white fabric at upper center" }, { "from": "gpt", "value": "(B) striped polo shirt at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/884e02720d562247.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.742, 0.334) (B) (0.292, 0.931) (C) (0.279, 0.403)" }, { "from": "gpt", "value": "(C) (0.279, 0.403)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1cd9e4c3e0ab1a85.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) camouflage fabric uniform at center (B) camouflage fabric rifle at center" }, { "from": "gpt", "value": "(A) camouflage fabric uniform at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/41426925a54f7802.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is white matte truck at center located relative to white tile pavement at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec7b5b9262d6e96a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.406, 0.505) (B) (0.791, 0.520)" }, { "from": "gpt", "value": "(B) (0.791, 0.520)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a304c6141e219a89.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) black matte video camera at lower left (B) dark suit at center" }, { "from": "gpt", "value": "(A) black matte video camera at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/005fb5ab66f84caf.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the matte white shirt at left? Choose from: (A) white matte vest at center (B) silky white tie at center" }, { "from": "gpt", "value": "(B) silky white tie at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7498861d5dbfa33.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.592, 0.739) (B) (0.328, 0.741)" }, { "from": "gpt", "value": "(B) (0.328, 0.741)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/32bb540b60bad41e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) silver foil wrapped butter at left (B) white creamy butter at center" }, { "from": "gpt", "value": "(A) silver foil wrapped butter at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95be5b9a8b2d9aa4.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) black plastic sony ericsson at center (B) black plastic keypad at lower center" }, { "from": "gpt", "value": "(A) black plastic sony ericsson at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7474eace567fea61.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.813, 0.558) (B) (0.246, 0.397) (C) (0.298, 0.764) (D) (0.883, 0.919)" }, { "from": "gpt", "value": "(D) (0.883, 0.919)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/15c1c556f790b07f.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) wooden table at center (B) red silk tie at center (C) matte black suit at center (D) black plastic microphone at center" }, { "from": "gpt", "value": "(A) wooden table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01ba25ece87db55f.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) smooth wooden ship at right (B) smooth wooden ship at center (C) smooth wooden ship at left (D) smooth wood bench at lower center" }, { "from": "gpt", "value": "(D) smooth wood bench at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9659e3eaecd4f1a4.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if wooden at right is wider than black fabric at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, wooden at right's width does not surpass black fabric at lower right's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f9d71707626453da.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the satin silver sedan at lower right among (A) green leafy tree at center (B) black wire at upper center (C) green textured tree at right?" }, { "from": "gpt", "value": "(C) green textured tree at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2b238ec564bebcc.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.730, 0.794) (B) (0.503, 0.578)" }, { "from": "gpt", "value": "(B) (0.503, 0.578)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/58cff6f1b6017aa7.jpg", "conversations": [ { "from": "human", "value": "\nIs denim jeans at lower left thinner than denim jeans at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, denim jeans at lower left might be wider than denim jeans at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/25f21a53c5069788.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the white glossy sedan at center? (A) white matte car at lower right (B) blue satin dress at center (C) metallic blue suv at center (D) brown dirt track at center" }, { "from": "gpt", "value": "(A) white matte car at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f60de7c1e5f63d83.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the red/yellow shirt at center? (A) gray concrete wall at center (B) red shirt at center" }, { "from": "gpt", "value": "(B) red shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e27976ca703304c3.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown furry dog at center is smaller than clear glass window at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, brown furry dog at center is not smaller than clear glass window at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36762b81e063d664.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) gold sequined dress at center (B) shiny black suit at center" }, { "from": "gpt", "value": "(B) shiny black suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0784c357510baac0.jpg", "conversations": [ { "from": "human", "value": "\nDoes patterned fabric dress at upper center appear over matte black turtle at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0bb58c04aac2f9c.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the yellow satin dress at center among (A) velvet blue coat at right (B) white satin dress at center left (C) white satin dress at upper left (D) white paper plate at lower left?" }, { "from": "gpt", "value": "(A) velvet blue coat at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4f125d98f717e527.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if wooden table at center is positioned to the right of rusty metallic phone at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, wooden table at center is not on the right side of rusty metallic phone at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d2648b4cf7e98470.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte gray t-shirt at center is wider than wooden paneling at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f061116999624d23.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the white plastic boat at center? (A) brown sandy beach at lower center (B) cloudy sky at center" }, { "from": "gpt", "value": "(A) brown sandy beach at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/909ffca4871d06f6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if yellow matte sunflower at center is wider than green bamboo stem at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, yellow matte sunflower at center is wider than green bamboo stem at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/75f090422d60265d.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black phone at center wider than floral fabric shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, matte black phone at center is wider than floral fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c60f2113ca4aa8a2.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.712, 0.492) (B) (0.640, 0.822) (C) (0.108, 0.327)" }, { "from": "gpt", "value": "(C) (0.108, 0.327)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f3fb29e38c6b1e32.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.754, 0.581) (B) (0.432, 0.475)" }, { "from": "gpt", "value": "(B) (0.432, 0.475)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60cb02a4afcbb4da.jpg", "conversations": [ { "from": "human", "value": "\nIs transparent plastic table at center to the left of green rubber beach ball at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, transparent plastic table at center is positioned on the left side of green rubber beach ball at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/adae3b58f7c35092.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) green leafy tree at center (B) green leafy tree at upper center (C) green needle-like branches at upper left" }, { "from": "gpt", "value": "(C) green needle-like branches at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc250be0a5d73407.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is white cotton flag at upper right located relative to dark gray fabric coat at lower left? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/57b949f178ffe558.jpg", "conversations": [ { "from": "human", "value": "\nIs green textured bush at center closer to the viewer compared to white stone sculpture at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is in front of white stone sculpture at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1790017b26f9d5f0.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the matte gray t-shirt at center among (A) metallic steel bars at center (B) golden fur lion at left?" }, { "from": "gpt", "value": "(B) golden fur lion at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c261a85917aefb49.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of wooden signboard at upper center in relation to multicolored woven tie at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/610cfe865402a892.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.926, 0.353) (B) (0.275, 0.248) (C) (0.349, 0.645)" }, { "from": "gpt", "value": "(A) (0.926, 0.353)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/776d8c4c8b1b6172.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) wooden board at center (B) light brown wood board at center (C) red cotton t-shirt at right (D) birch plywood at center" }, { "from": "gpt", "value": "(A) wooden board at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3984efdb4b285e62.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if teal matte vest at center is smaller than white matte snowboard at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, teal matte vest at center is not smaller than white matte snowboard at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6faa518e322bdfd1.jpg", "conversations": [ { "from": "human", "value": "\nIs white creamy cake at center above yellow matte popcorn at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, white creamy cake at center is not above yellow matte popcorn at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f3ddb1d5f8f44c1e.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) black matte shirt at center (B) blue glossy antelope at upper right" }, { "from": "gpt", "value": "(A) black matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/47d9775f480344e2.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of dark blue water at center in reference to white smoke at upper center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/53fe82e6cc2780db.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.057, 0.205) (B) (0.589, 0.889)" }, { "from": "gpt", "value": "(B) (0.589, 0.889)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d05c2c22b4b327dd.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.041, 0.186) (B) (0.697, 0.402)" }, { "from": "gpt", "value": "(A) (0.041, 0.186)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd8ed6ec6fef8160.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of dark brown leather jacket at center in reference to matte brown hair at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/62e7d10e695cfd3d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.586, 0.495) (B) (0.063, 0.361) (C) (0.420, 0.381)" }, { "from": "gpt", "value": "(B) (0.063, 0.361)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ed0997e8dd74671.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the gold metallic pole at left? Choose from: (A) silver metallic guardrail at lower right (B) silver metallic pole at left" }, { "from": "gpt", "value": "(A) silver metallic guardrail at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77147ed5f02c1b16.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of black matte/leather jacket at center and matte blue costume at lower left in the image provided, where is black matte/leather jacket at center located with respect to matte blue costume at lower left? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/51ad7783b4548f99.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black dress at left is positioned to the right of clear glass wine at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, matte black dress at left is not to the right of clear glass wine at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/10fc107d0be71e7e.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the matte orange plush toy at lower left? (A) white plush toy at center (B) matte yellow plush toy at lower left" }, { "from": "gpt", "value": "(B) matte yellow plush toy at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73ac5543f6b9e3c0.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.540, 0.395) (B) (0.578, 0.789)" }, { "from": "gpt", "value": "(B) (0.578, 0.789)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/614efd5fdd3d80fe.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark blue suit at right is smaller than peachy fabric jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, dark blue suit at right might be larger than peachy fabric jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d488671c3197412.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) yellow matte shirt at center (B) white painted wood cart at center (C) shiny chrome motorcycle at left (D) light blue shirt at left" }, { "from": "gpt", "value": "(A) yellow matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b883491ff915874.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.910, 0.795) (B) (0.838, 0.592)" }, { "from": "gpt", "value": "(A) (0.910, 0.795)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/026cde425ea95a4d.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) spotted fur snow leopard at center (B) green leafy grass at lower left (C) wire mesh fence at upper center" }, { "from": "gpt", "value": "(C) wire mesh fence at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/efc7ea72e7aa1531.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the wooden table at lower left? Choose from: (A) blue paperback book at lower left (B) black and white fur at center" }, { "from": "gpt", "value": "(B) black and white fur at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fdb804953c8b4528.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.208, 0.772) (B) (0.471, 0.730)" }, { "from": "gpt", "value": "(B) (0.471, 0.730)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b737e5b840037416.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) matte pink fabric hat at center (B) clear glass window at center (C) polka dot fabric hat at center" }, { "from": "gpt", "value": "(B) clear glass window at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7cfc4ef10696e177.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown wooden rail at right have a larger size compared to white sheer curtain at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, brown wooden rail at right is larger in size than white sheer curtain at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9cbfbca5c789219f.jpg", "conversations": [ { "from": "human", "value": "\nDoes shiny black car at center have a greater width compared to dark gray uniform at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, the width of shiny black car at center exceeds that of dark gray uniform at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d5e94398ee18785.jpg", "conversations": [ { "from": "human", "value": "\nDoes green grass at center have a larger size compared to orange cotton shirt at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, green grass at center is larger in size than orange cotton shirt at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8186c3a66829a22b.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) dark brown fuzzy beard at center (B) white matte uniform at right (C) white fabric chef coat at left" }, { "from": "gpt", "value": "(C) white fabric chef coat at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e51a34cb7131e6e2.jpg", "conversations": [ { "from": "human", "value": "\nWhere is rusty corrugated metal hut at center located in relation to blue striped shirt at lower center in the image? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b64386d65843f294.jpg", "conversations": [ { "from": "human", "value": "\nDoes pink satin dress at center have a greater width compared to shiny satin blouse at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, pink satin dress at center is wider than shiny satin blouse at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/673ab9db97782509.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) black matte shirt at center (B) camouflage fabric uniform at left" }, { "from": "gpt", "value": "(B) camouflage fabric uniform at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/55b2b0b2a74f0740.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) shiny metallic jacket at center (B) shiny metallic helmet at center" }, { "from": "gpt", "value": "(B) shiny metallic helmet at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd479b8ebad676a9.jpg", "conversations": [ { "from": "human", "value": "\nDoes orange matte jacket at center have a lesser width compared to matte black camera at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, orange matte jacket at center might be wider than matte black camera at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34ea7172154ae502.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of green glossy water at center in reference to green leafy tree at upper center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/12e7bb8c02ee70c5.jpg", "conversations": [ { "from": "human", "value": "\nDoes woven rattan lounge chair at center appear on the left side of woven rattan chair at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, woven rattan lounge chair at center is to the right of woven rattan chair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8960553f3f2e4603.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green wood field at center located in relation to wooden picnic table at lower left in the image? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1779fce8c0e3a035.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) wooden fence at center (B) white fabric tent at center" }, { "from": "gpt", "value": "(B) white fabric tent at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ebb6aa30a29c648d.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) green matte tree at center (B) yellow plastic tree at right (C) green leafy trees at left" }, { "from": "gpt", "value": "(A) green matte tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1a783f7f069c787a.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at center appear over green leafy tree at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, green leafy tree at center is above green leafy tree at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ed42d1d740c5563.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if silver metallic laptop at center is positioned below sleek silver laptop at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5d41662f2c3d54d0.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass at lower left above brown leafless tree at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, green grass at lower left is not above brown leafless tree at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/26b787e7ae019820.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) beige concrete building at right (B) glassy steel skyscraper at center (C) dark glass skyscraper at center, is positioned farthest from the shiny glass tower at center?" }, { "from": "gpt", "value": "(A) beige concrete building at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/090be286e8a055d4.jpg", "conversations": [ { "from": "human", "value": "\nIs green matte sign at center below red led pedestrian signal at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/91538f3310d462d0.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) smooth beige blouse at upper center (B) dark suit at center" }, { "from": "gpt", "value": "(B) dark suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba65b4304f691abb.jpg", "conversations": [ { "from": "human", "value": "\nDoes metallic red crane at right come in front of blue plastic sign at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, metallic red crane at right is behind blue plastic sign at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/033209daf5335544.jpg", "conversations": [ { "from": "human", "value": "\nIs silver metallic bicycle at center to the left of blue fabric jacket at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find silver metallic bicycle at center to the left of blue fabric jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6854ce4cbc9f92ce.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) white matte/soft fabric at center (B) white matte dress at center" }, { "from": "gpt", "value": "(B) white matte dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d7de4a29626b5951.jpg", "conversations": [ { "from": "human", "value": "\nDoes purple fleece blanket at center appear on the right side of orange fleece jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, purple fleece blanket at center is to the right of orange fleece jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb1465315f29d095.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of matte brown jacket at left in relation to smooth leather gloves at center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01375c81e3f3627b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if beige sand at center is bigger than white floral dress at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, beige sand at center is larger in size than white floral dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3dd3d53d11e1910d.jpg", "conversations": [ { "from": "human", "value": "\nDoes silver metallic suv at center appear under green leafy tree at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, silver metallic suv at center is below green leafy tree at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6861653028b14bad.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) blue water at center (B) white glossy boat at left" }, { "from": "gpt", "value": "(A) blue water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/20abe22cf606f408.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the green striped polo shirt at center? Choose from: (A) gray concrete pavement at center (B) matte orange shirt at center" }, { "from": "gpt", "value": "(B) matte orange shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fd10912313fb2361.jpg", "conversations": [ { "from": "human", "value": "\nDoes green grass at center have a greater width compared to dark brown fabric pants at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green grass at center has a greater width compared to dark brown fabric pants at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/094b5dc455cb4efe.jpg", "conversations": [ { "from": "human", "value": "\nIs satin silver fork at center to the right of matte silver spoon at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, satin silver fork at center is not on the right side of matte silver spoon at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9341c6ed164ae11f.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.104, 0.958) (B) (0.722, 0.902)" }, { "from": "gpt", "value": "(A) (0.104, 0.958)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d4ae24cbd2a1d20c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the blue striped shirt at center? Choose among these: (A) blue glass at center (B) blue denim jeans at left" }, { "from": "gpt", "value": "(B) blue denim jeans at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0c91e0833da172c6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte green t-shirt at center is positioned to the right of red matte strawberry at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, matte green t-shirt at center is not on the right side of red matte strawberry at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/12186330b4865f21.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.401, 0.639) (B) (0.270, 0.820) (C) (0.770, 0.697)" }, { "from": "gpt", "value": "(B) (0.270, 0.820)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/45a496b34f89d182.jpg", "conversations": [ { "from": "human", "value": "\nDoes white plastic railroad crossing sign at upper left appear under red matte traffic light at center right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c8530a0876b1ed8.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.230, 0.747) (B) (0.406, 0.811)" }, { "from": "gpt", "value": "(B) (0.406, 0.811)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0dd9d691d3e5dd46.jpg", "conversations": [ { "from": "human", "value": "\nDoes white smooth column at right have a larger size compared to white smooth column at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, white smooth column at right has a larger size compared to white smooth column at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d2ab2537d3944e23.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the orange fabric tent at upper right among (A) gray/white fabric tent at center (B) blue cotton shirt at center (C) green canvas tent at upper center (D) green fabric tent at lower right?" }, { "from": "gpt", "value": "(A) gray/white fabric tent at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0347059fc129d407.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy hedge at upper left is smaller than matte black purse at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, green leafy hedge at upper left is not smaller in size than matte black purse at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ee9ed7afddf7a137.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the clear plastic bottle at table? Select from: (A) light blue cotton shirt at lower right (B) pink cotton shirt at center" }, { "from": "gpt", "value": "(B) pink cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c3fca14493493f8e.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the wooden table at lower right? (A) matte gray shirt at center (B) plaid shirt at right" }, { "from": "gpt", "value": "(B) plaid shirt at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00df5792e4489aa0.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) matte brown leather hat at center (B) brown leather baseball hat at upper center (C) matte gray cap at center (D) black matte baseball cap at upper center" }, { "from": "gpt", "value": "(C) matte gray cap at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f7745c26ee4ccba3.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black suit at center further to camera compared to white ribbed sweater at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, matte black suit at center is in front of white ribbed sweater at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc0bd252590a5c40.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) matte black guitar at center (B) matte acoustic guitar at left (C) matte black guitar at left" }, { "from": "gpt", "value": "(B) matte acoustic guitar at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2bba7f3daf3dc07.jpg", "conversations": [ { "from": "human", "value": "\nIs white plastic table at center above black plastic smartphone at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, white plastic table at center is above black plastic smartphone at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9991b2504fdbad9d.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) metallic saw at center (B) smooth wooden plank at lower center (C) white matte dress at center" }, { "from": "gpt", "value": "(B) smooth wooden plank at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0bafb9387e91b41.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte red hat at lower left is wider than matte red fez at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, the width of matte red hat at lower left exceeds that of matte red fez at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/126de181b518a09d.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black shirt at center to the right of white paper at left from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte black shirt at center is to the right of white paper at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0e6cc3433e6f5bc2.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.424, 0.644) (B) (0.445, 0.402) (C) (0.764, 0.916)" }, { "from": "gpt", "value": "(C) (0.764, 0.916)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2c4afaa55f3502cd.jpg", "conversations": [ { "from": "human", "value": "\nDoes white glossy surfboard at left lie behind white smooth surfboard at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is behind white smooth surfboard at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d07700f1d13e36ab.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if rubber textured basketball at center is positioned to the left of rubber textured basketball at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find rubber textured basketball at center to the left of rubber textured basketball at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b648d2515ad0f70a.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of light yellow shirt at center and shiny blue suit at stage left in the image provided, where is light yellow shirt at center located with respect to shiny blue suit at stage left? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cebd1057921c7035.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.638, 0.333) (B) (0.093, 0.347)" }, { "from": "gpt", "value": "(B) (0.093, 0.347)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/876086fd507167f4.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) dark gray suit at center (B) black metallic microphone at center (C) brown textured suit at center (D) dark suit at center" }, { "from": "gpt", "value": "(A) dark gray suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/494505b3501cdf1b.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) white paper at center (B) matte paper map at center" }, { "from": "gpt", "value": "(B) matte paper map at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6ff74d3e7fd714e7.jpg", "conversations": [ { "from": "human", "value": "\nDoes printed cotton shirt at upper right appear on the left side of knit sweater at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, printed cotton shirt at upper right is not to the left of knit sweater at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca915d6e16525080.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.426, 0.606) (B) (0.302, 0.891)" }, { "from": "gpt", "value": "(A) (0.426, 0.606)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a565c9e1246213d9.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) matte green car at right (B) white matte car at center (C) white matte vintage car at left" }, { "from": "gpt", "value": "(A) matte green car at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/afedcacfae258db4.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the brown rough log at center? (A) spotted fur leopard at left (B) spotted fur leopard at center (C) brown rough tree trunk at center" }, { "from": "gpt", "value": "(A) spotted fur leopard at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c421b295b1ee9d2e.jpg", "conversations": [ { "from": "human", "value": "\nIs gray matte water at center further to the viewer compared to gray textured tail fin at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, gray matte water at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a13c912caddc1cd2.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.285, 0.870) (B) (0.570, 0.603)" }, { "from": "gpt", "value": "(B) (0.570, 0.603)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e029c4bdcf8625ff.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black fabric table at lower right is wider than beige fabric table at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, black fabric table at lower right is wider than beige fabric table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f30143cb236bd2e4.jpg", "conversations": [ { "from": "human", "value": "\nIs brushed metal suit at left to the right of light blue shirt at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, brushed metal suit at left is to the left of light blue shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3f63b5e283927e92.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte blue-green hoodie at left have a greater width compared to matte red jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, matte blue-green hoodie at left has a greater width compared to matte red jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fda1187a119c1dcc.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at center above wooden gazebo at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, green leafy tree at center is above wooden gazebo at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/971256d3f686c01c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.300, 0.705) (B) (0.371, 0.856) (C) (0.326, 0.625)" }, { "from": "gpt", "value": "(C) (0.326, 0.625)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8f2a9620aa7043f5.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if silver metallic car at lower right is bigger than white matte car at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/761baac41839fd04.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is wooden bowl at upper right located relative to speckled feathered bird at left? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/38f3a23c43be2e5b.jpg", "conversations": [ { "from": "human", "value": "\nWhere is smooth gray bark at left located in relation to pink fabric at center in the image? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a24f98b518979203.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the dark blue shirt at left among (A) white cotton shirt at right (B) green matte convertible at center (C) satin beige sedan at center (D) green matte car at center?" }, { "from": "gpt", "value": "(C) satin beige sedan at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1080b6e5f9c8d8bf.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.864, 0.484) (B) (0.720, 0.550)" }, { "from": "gpt", "value": "(A) (0.864, 0.484)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ff71ece661a58b51.jpg", "conversations": [ { "from": "human", "value": "\nWhere is dry grass at upper right located in relation to black metal bridge at upper center in the image? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e27b83f55e040fd.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue metallic ladder at upper right have a greater width compared to crystal glass chandelier at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, blue metallic ladder at upper right has a greater width compared to crystal glass chandelier at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8ee628fdb30f4736.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) gray textured elephant at center (B) gray matte elephant at lower center" }, { "from": "gpt", "value": "(A) gray textured elephant at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e8814f3c15142e9.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) white lace curtain at center (B) green leafy bush at center (C) white lace curtain at left" }, { "from": "gpt", "value": "(A) white lace curtain at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/140a0ab7c15cb7db.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if clear glass window at left is positioned to the left of green glossy table at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, clear glass window at left is positioned on the left side of green glossy table at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd9b8e2584e840f5.jpg", "conversations": [ { "from": "human", "value": "\nIs navy blue polo shirt at left to the left of whiteboard at upper center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, navy blue polo shirt at left is to the left of whiteboard at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6166f774eea8758b.jpg", "conversations": [ { "from": "human", "value": "\nDoes golden fur dog at center have a lesser width compared to black woven collar at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, golden fur dog at center's width is not less than black woven collar at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/27600370fcc3df23.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.894, 0.873) (B) (0.365, 0.741)" }, { "from": "gpt", "value": "(A) (0.894, 0.873)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9903b33cc5c473c9.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if cobblestone path at center is positioned below blue denim jeans at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, cobblestone path at center is located below blue denim jeans at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/87a9652d5a7c9b86.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at left below green leafy tree at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, green leafy tree at left is below green leafy tree at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00328039fca6f64c.jpg", "conversations": [ { "from": "human", "value": "\nIs white plastic picnic table at lower left smaller than white plastic picnic table at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/68375170af814250.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark gray suit at left is positioned below brown wooden table at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/12715bb380b7da9d.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the smooth skin baby at lower right? (A) smooth beige doll at center (B) smooth hoodie at center (C) smooth skin child at left" }, { "from": "gpt", "value": "(C) smooth skin child at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f79f55c17c949ba.jpg", "conversations": [ { "from": "human", "value": "\nDoes white paper cupcake at center have a larger size compared to pink frosted ice cream at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, white paper cupcake at center is bigger than pink frosted ice cream at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ab198286c45af84.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black hoodie at center appear on the right side of brown checkered shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, matte black hoodie at center is not on the right side of brown checkered shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d20ef0f94c50b0e3.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.381, 0.039) (B) (0.103, 0.830)" }, { "from": "gpt", "value": "(A) (0.381, 0.039)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/81f97117bfd6a86b.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.138, 0.398) (B) (0.192, 0.503) (C) (0.082, 0.623)" }, { "from": "gpt", "value": "(C) (0.082, 0.623)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b2a0eb1f4d90ba3.jpg", "conversations": [ { "from": "human", "value": "\nDoes cobblestone path at center appear over gray stone stairs at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, cobblestone path at center is above gray stone stairs at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/28c5afe450ae5824.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue hardcover book at center have a greater width compared to hardcover book at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, blue hardcover book at center has a greater width compared to hardcover book at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f248c45f69c323a6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown shingles at upper left is positioned above silver metallic ladder at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, brown shingles at upper left is positioned over silver metallic ladder at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0c5d43727574ff0.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the white satin dress at center? Choose from: (A) rough textured rock at lower left (B) matte black suit at center" }, { "from": "gpt", "value": "(B) matte black suit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc8cce4a6826721b.jpg", "conversations": [ { "from": "human", "value": "\nIs metallic bar stool at center closer to the viewer compared to velvet blue pillow at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is behind velvet blue pillow at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7931c84807f48f14.jpg", "conversations": [ { "from": "human", "value": "\nDoes red matte shirt at right lie behind matte black shirt at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/673e9da5aaf184e9.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.069, 0.509) (B) (0.894, 0.362)" }, { "from": "gpt", "value": "(B) (0.894, 0.362)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4c94f48975e2362.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of metallic silver table at lower left and wooden table at center in the image provided, where is metallic silver table at lower left located with respect to wooden table at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c1783a2d3959c629.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) orange jersey at center (B) orange matte t-shirt at center" }, { "from": "gpt", "value": "(B) orange matte t-shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9a236fedb8f037b9.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of light brown leather jacket at lower left and dark blue jeans at center in the image provided, where is light brown leather jacket at lower left located with respect to dark blue jeans at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cb516c98cb95ff91.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.537, 0.731) (B) (0.365, 0.536) (C) (0.460, 0.814) (D) (0.656, 0.680)" }, { "from": "gpt", "value": "(B) (0.365, 0.536)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f91b852418a4bffd.jpg", "conversations": [ { "from": "human", "value": "\nDoes translucent glass window at center appear on the right side of yellow matte light at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, translucent glass window at center is not on the right side of yellow matte light at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0f6b6c6c0116c1b.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.094, 0.648) (B) (0.456, 0.853)" }, { "from": "gpt", "value": "(B) (0.456, 0.853)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/32c6dfedcb623b44.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.188, 0.466) (B) (0.343, 0.181) (C) (0.525, 0.314)" }, { "from": "gpt", "value": "(A) (0.188, 0.466)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3ede7d8207c75d90.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) metallic pink ipod at center (B) pink glossy ipod at lower center" }, { "from": "gpt", "value": "(B) pink glossy ipod at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f3ec8e57dbefaa4.jpg", "conversations": [ { "from": "human", "value": "\nIs blue neoprene wetsuit at center above blue matte water at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, blue neoprene wetsuit at center is above blue matte water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0af00bb3900255db.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brick textured building at left is smaller than matte black sign at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, brick textured building at left might be larger than matte black sign at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/41fbc1f03c5b7f89.jpg", "conversations": [ { "from": "human", "value": "\nDoes silver metallic sedan at lower right appear over black plastic license plate at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cbae3a27a86f5b2e.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown dirt track at lower right is smaller than yellow fabric person at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, brown dirt track at lower right might be larger than yellow fabric person at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/27a540789efe6d9e.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.600, 0.578) (B) (0.961, 0.503)" }, { "from": "gpt", "value": "(B) (0.961, 0.503)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5183f850869aa2f4.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of white fluffy snow at center in reference to white snow-covered tree at left? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cebd1057921c7035.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) dark gray metallic helicopter at upper center (B) black matte goggles at left" }, { "from": "gpt", "value": "(A) dark gray metallic helicopter at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6510d7b74f2a4b35.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue/yellow painted locomotive at center is positioned below blue polished metal locomotive at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/19bebaa900b6f7da.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) light gray cotton shirt at left (B) transparent plastic cup at center" }, { "from": "gpt", "value": "(A) light gray cotton shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3143678daa4c5e47.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.155, 0.600) (B) (0.709, 0.259) (C) (0.825, 0.331)" }, { "from": "gpt", "value": "(B) (0.709, 0.259)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a36b95831e634ebb.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) green leafy plant at center (B) black cotton polo shirt at center" }, { "from": "gpt", "value": "(A) green leafy plant at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2dbb682baa3a8fee.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black jacket at left have a larger size compared to dark gray leather jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c7239ab0c0aa65ce.jpg", "conversations": [ { "from": "human", "value": "\nIs matte yellow curtain at upper center further to camera compared to white cloth at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/38179db4024c2f08.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the blue fabric shirt at right? (A) denim jacket at center (B) white cotton shirt at center (C) purple matte sweater at center (D) green metallic train at center" }, { "from": "gpt", "value": "(C) purple matte sweater at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/12d1159ff1b127b7.jpg", "conversations": [ { "from": "human", "value": "\nDoes silver metallic truck at right appear on the right side of matte red fire truck at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find silver metallic truck at right to the right of matte red fire truck at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7aa41acd93efaace.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) metallic silver shoes at center (B) transparent glass door at center (C) white paper sign at lower left" }, { "from": "gpt", "value": "(C) white paper sign at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d74b3faf3969a57.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the transparent glass window at upper right? Choose among these: (A) matte gray glass window at center (B) matte glass window at center" }, { "from": "gpt", "value": "(B) matte glass window at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/acc1df418be909a1.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of matte black screen at center less distant than that of black matte mouse at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/15d582e755231eb4.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of yellow shingles at center and yellow painted wood porch at lower center in the image provided, where is yellow shingles at center located with respect to yellow painted wood porch at lower center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b894ddb3eb113b5.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) dark gray matte duck at left (B) black glossy duck at center (C) dark gray matte duck at right" }, { "from": "gpt", "value": "(B) black glossy duck at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/75b8d61c82e4d080.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.428, 0.502) (B) (0.132, 0.972)" }, { "from": "gpt", "value": "(A) (0.428, 0.502)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/41516e1149de3f92.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy bush at center right thinner than green rough bark tree at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, green leafy bush at center right's width is not less than green rough bark tree at left's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4ad53ceb9385aab0.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.631, 0.781) (B) (0.349, 0.883) (C) (0.546, 0.314) (D) (0.830, 0.939)" }, { "from": "gpt", "value": "(B) (0.349, 0.883)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6664e1b0f34d53f2.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) green rough bark tree at right (B) green leafy tree at center" }, { "from": "gpt", "value": "(B) green leafy tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/128465f8c24e4857.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow-brick building at center positioned before wooden cart at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is in front of wooden cart at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eea217232aedcd26.jpg", "conversations": [ { "from": "human", "value": "\nWhere is clear glass water at center located in relation to red matte jacket at center in the image? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4352eafe9a0f4c1f.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.023, 0.992) (B) (0.066, 0.312)" }, { "from": "gpt", "value": "(B) (0.066, 0.312)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b6989d3918788ec.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white checkered shirt at center is positioned above matte black shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, white checkered shirt at center is positioned over matte black shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ea3657a07decd7a.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.150, 0.623) (B) (0.225, 0.658)" }, { "from": "gpt", "value": "(A) (0.150, 0.623)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d65b13d3120cd6aa.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte yellow vest at left is thinner than silky blue hair at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, matte yellow vest at left is not thinner than silky blue hair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6e503380ea195c1c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the clear plastic keyboard at center? Select from: (A) silver metallic microphone at center (B) silver metallic laptop at right" }, { "from": "gpt", "value": "(B) silver metallic laptop at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f1d71cda4a55e7a.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the white plastic table at center? Choose from: (A) black plastic speaker at center (B) matte black laptop at upper center (C) metallic at upper right (D) white cloth at left" }, { "from": "gpt", "value": "(A) black plastic speaker at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/701ce879c6dcd1c5.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) gold metallic plaque at center (B) white glossy rocket at left" }, { "from": "gpt", "value": "(B) white glossy rocket at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e09b96d1c7fd0018.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of green leafy tree at right more distant than that of green leafy trees at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dba8514d2ac8540b.jpg", "conversations": [ { "from": "human", "value": "\nDoes gray suit at center appear on the right side of smooth gray suit at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find gray suit at center to the right of smooth gray suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00399b464a5776cf.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the purple checkered shirt at center? (A) black satin dress at center (B) matte beige shawl at left (C) matte blue shirt at center" }, { "from": "gpt", "value": "(A) black satin dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b3e0cf312e1ac968.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the white matte jersey at center? (A) blue jersey at center (B) black jersey at center (C) green grass at center" }, { "from": "gpt", "value": "(B) black jersey at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/47b53d83dba9c5f6.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) green leafy tree at upper right (B) green grass at center, is positioned closest to the dirt path at center?" }, { "from": "gpt", "value": "(B) green grass at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78cc6544abf84953.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of yellow glossy cake at left less distant than that of yellow glossy cake at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is in front of yellow glossy cake at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5cacd4467d9b96d2.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.407, 0.927) (B) (0.280, 0.505)" }, { "from": "gpt", "value": "(B) (0.280, 0.505)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bcbd1579e8dbf979.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.313, 0.650) (B) (0.679, 0.086)" }, { "from": "gpt", "value": "(A) (0.313, 0.650)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e4ab7bb20294a721.jpg", "conversations": [ { "from": "human", "value": "\nDoes green grass at lower center appear on the right side of shiny red sedan at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, green grass at lower center is positioned on the right side of shiny red sedan at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ae4af23121905157.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark gray cloud at upper center is positioned below white glossy cruise ship at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, dark gray cloud at upper center is not positioned below white glossy cruise ship at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6be1324b03f25f03.jpg", "conversations": [ { "from": "human", "value": "\nDoes shiny metallic sunglasses at center lie behind skinsmoothhand at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b97604ad52cca01.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of clear glass window at center and transparent glass window at upper center in the image provided, where is clear glass window at center located with respect to transparent glass window at upper center? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/823c70e6cbf21e1e.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of black textured dress at center and smooth bald head at center in the image provided, where is black textured dress at center located with respect to smooth bald head at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7c62029b4f1bb8ff.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the green matte ship at center? (A) pink fabric at lower left (B) blue fabric at lower center (C) blue shirt at lower left (D) transparent water at lower right" }, { "from": "gpt", "value": "(A) pink fabric at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/94a5435207b44f01.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte truck at lower right wider than shiny black sedan at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cbdc60b09556f0c2.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.185, 0.380) (B) (0.447, 0.758) (C) (0.473, 0.698)" }, { "from": "gpt", "value": "(C) (0.473, 0.698)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/66f1cb93fdd1a8d6.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if transparent glass windshield at center is thinner than matte black sedan at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, transparent glass windshield at center might be wider than matte black sedan at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46bafefecc8e60e6.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is white stone lion at upper center located relative to yellow leafy branches at upper left? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/290241db1bc5444d.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) blue dotted shirt at upper left (B) floral cotton dress at lower right (C) striped cotton shirt at center" }, { "from": "gpt", "value": "(C) striped cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/deaa51eef6ba431c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.211, 0.316) (B) (0.564, 0.634) (C) (0.169, 0.431) (D) (0.079, 0.980)" }, { "from": "gpt", "value": "(C) (0.169, 0.431)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0561be6dc0b4e908.jpg", "conversations": [ { "from": "human", "value": "\nIs green matte plate at center above white glossy plate at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, green matte plate at center is below white glossy plate at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0010636567c3193d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.203, 0.473) (B) (0.187, 0.830)" }, { "from": "gpt", "value": "(A) (0.203, 0.473)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b304744768f8def0.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white matte convertible at center is positioned to the right of white satin dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, white matte convertible at center is to the right of white satin dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70007519c1deb139.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.434, 0.125) (B) (0.904, 0.298) (C) (0.518, 0.217) (D) (0.932, 0.864)" }, { "from": "gpt", "value": "(A) (0.434, 0.125)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/051289a080bb8d58.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if knitted wool scarf at center is positioned to the left of matte brown jacket at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, knitted wool scarf at center is to the left of matte brown jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/42cca5e6dee1def8.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of brown brick tower at upper center in reference to clear glass lantern at upper right? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/19d63a60eb835f98.jpg", "conversations": [ { "from": "human", "value": "\nDoes metallic silver bicycle at center have a smaller size compared to dark gray fabric shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, metallic silver bicycle at center is not smaller than dark gray fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/97033bfbd22c6844.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of wooden dock at center in reference to brown wooden dock at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bc5e2c74188691b3.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) maroon shirt at upper center (B) white matte shirt at upper right" }, { "from": "gpt", "value": "(A) maroon shirt at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9b2df80ec82532bd.jpg", "conversations": [ { "from": "human", "value": "\nDoes clear glass tunnel at center have a greater width compared to green textured tree at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, clear glass tunnel at center is not wider than green textured tree at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3af954d485f345c2.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.752, 0.272) (B) (0.433, 0.362) (C) (0.073, 0.266)" }, { "from": "gpt", "value": "(B) (0.433, 0.362)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/202e37b159e2e603.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of shiny black ant at center less distant than that of shiny black ant at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/068ac4bf7ba4c1de.jpg", "conversations": [ { "from": "human", "value": "\nDoes sandy beach at center appear under transparent water at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/589c9fc9cd96f067.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is white matte unicorn head at center located relative to matte black mask at center? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc7128482ccefa8a.jpg", "conversations": [ { "from": "human", "value": "\nIs brown matte water at lower left behind black matte ship at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/421e9a8bbe3995f3.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.512, 0.248) (B) (0.518, 0.472)" }, { "from": "gpt", "value": "(B) (0.518, 0.472)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/54cacab2c5ff6ca2.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy tree at center is positioned to the right of brown muddy water at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, green leafy tree at center is to the right of brown muddy water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4bc708c2ca7e6836.jpg", "conversations": [ { "from": "human", "value": "\nIs snow-covered wooden roof at upper center positioned behind brown wooden fence at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is behind brown wooden fence at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c131417902b8804.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the light brown wood table at lower left? (A) black suit at left (B) uniformed military officer at center" }, { "from": "gpt", "value": "(B) uniformed military officer at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/48ffeb7d6005a3ff.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black suit at left positioned at the back of striped fabric tie at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6d97637436135360.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) blue plastic parking sign at lower center (B) black wrought iron balcony at center" }, { "from": "gpt", "value": "(B) black wrought iron balcony at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f3df2333ed7e2dbf.jpg", "conversations": [ { "from": "human", "value": "\nIs white painted metal tower at upper right above white painted wood at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, white painted metal tower at upper right is positioned over white painted wood at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/53232967c1c9a9be.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if charred wood log at center is positioned to the left of black textured whale at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, charred wood log at center is to the right of black textured whale at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/101a5ab1fc451da8.jpg", "conversations": [ { "from": "human", "value": "\nIs white fabric raft at center thinner than white plastic paddle at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, white fabric raft at center's width is not less than white plastic paddle at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/82ca386bdd26811c.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of snowy rock at center and brown fur at center in the image provided, where is snowy rock at center located with respect to brown fur at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fbfb6cc82e0910c8.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) shiny blue snowboard at upper left (B) white matte snowboarder at center (C) gray matte snowboarder at upper left" }, { "from": "gpt", "value": "(A) shiny blue snowboard at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b0569a86d2fdbf35.jpg", "conversations": [ { "from": "human", "value": "\nIs dark brown hair at center thinner than smooth skin face at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b803722550d9f3e9.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte terracotta head at center is smaller than matte terracotta head at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, matte terracotta head at center is not smaller in size than matte terracotta head at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3458fb224037f830.jpg", "conversations": [ { "from": "human", "value": "\nIs major red pattern radiations at upper center closer to the viewer compared to matte white butterfly at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/abec53069698d280.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) rubberized yellow toy at center (B) white plastic table at center (C) rubber matte block at table" }, { "from": "gpt", "value": "(B) white plastic table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0353c1d2ace2ab5d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.091, 0.689) (B) (0.565, 0.383)" }, { "from": "gpt", "value": "(B) (0.565, 0.383)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0c16f7876f54294.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the brown wooden chair at center from the following options: (A) wooden rocking chair at center (B) clear glass door at left?" }, { "from": "gpt", "value": "(B) clear glass door at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/70b4f8009860abc4.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of concrete steps at center more distant than that of clear blue water at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, concrete steps at center is in front of clear blue water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/457b68b4f60ce4ed.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) brown brick chimney at upper center (B) white brick chimney at upper center" }, { "from": "gpt", "value": "(B) white brick chimney at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5083f8721a34bc5.jpg", "conversations": [ { "from": "human", "value": "\nIs white translucent cubes at center thinner than transparent glass bowl at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white translucent cubes at center's width is not less than transparent glass bowl at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bbcf7529da578ef4.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) yellow matte signboard at center (B) yellow matte/black textured cross at upper center (C) metallic pole at center (D) yellow/yellowish metal sign at lower center" }, { "from": "gpt", "value": "(D) yellow/yellowish metal sign at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/39b627c92c0d81ca.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at center appear on the right side of shiny black motorcycle at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, green leafy tree at center is to the right of shiny black motorcycle at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a62e0cbbdf19fbb9.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white glossy boat at lower left is bigger than dark gray metallic sailboat at center-left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, white glossy boat at lower left is larger in size than dark gray metallic sailboat at center-left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/caca5acbb78034fb.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if bare branches at upper center is positioned to the left of green leafy bush at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find bare branches at upper center to the left of green leafy bush at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a8dc52b6c854c16d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if shiny purple chocolate bar at right is positioned to the left of translucent plastic bag of candy at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, shiny purple chocolate bar at right is not to the left of translucent plastic bag of candy at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/629b1208aeb9c282.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is dark brown bark tree at left located relative to bare branches at left? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ade27a6b867eca66.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.529, 0.681) (B) (0.411, 0.775) (C) (0.497, 0.830)" }, { "from": "gpt", "value": "(B) (0.411, 0.775)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1799a2b22931c207.jpg", "conversations": [ { "from": "human", "value": "\nIs denim shirt at left above smooth concrete curb at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, denim shirt at left is above smooth concrete curb at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f903e58ae1a55d23.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the dark skin tattoo at upper center? Choose from: (A) brownhair at center (B) matte skin face at center (C) tattooed skin at upper center" }, { "from": "gpt", "value": "(B) matte skin face at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b26e5bd7b357fe0.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of matte paper poster at upper right and matte paper maps & instruments at center in the image provided, where is matte paper poster at upper right located with respect to matte paper maps & instruments at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fcc9f07afc9197a8.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black matte tank top at left is positioned to the left of white matte tank top at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, black matte tank top at left is positioned on the left side of white matte tank top at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c88a0d612dba128a.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the yellow reflective vest at center? Choose from: (A) high-visibility fabric safety vest at center (B) yellow reflective safety vest at upper center (C) white smooth concrete at center" }, { "from": "gpt", "value": "(C) white smooth concrete at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1ec95d514f2dd169.jpg", "conversations": [ { "from": "human", "value": "\nIs white glossy table at center below blue cotton shirt at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, white glossy table at center is located below blue cotton shirt at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/56cc8343bb851515.jpg", "conversations": [ { "from": "human", "value": "\nWhere is shiny gray pagoda at upper right located in relation to gray foggy mountain at left in the image? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88e8e7b907f9fa0a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if yellow plastic boat at center is positioned above red plastic food cart at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, yellow plastic boat at center is not above red plastic food cart at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0fa30f4b4e744196.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown/dry soil at left is smaller than asphalt road at right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, brown/dry soil at left might be larger than asphalt road at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a0a90ac0fd46f732.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue liquid water at lower center is bigger than green matte tree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, blue liquid water at lower center is not larger than green matte tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6077046eb6a6d850.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the black asphalt pavement at lower left? (A) yellow matte tree at upper right (B) silver metallic street sign at left" }, { "from": "gpt", "value": "(B) silver metallic street sign at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/57ea49271a4eaf6a.jpg", "conversations": [ { "from": "human", "value": "\nIs paper map at center positioned in front of matte black sunglasses at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/673fd087855488a5.jpg", "conversations": [ { "from": "human", "value": "\nDoes camouflage fabric uniform at left appear on the right side of american flag at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, camouflage fabric uniform at left is to the left of american flag at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b7d36bc19a9069ff.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.680, 0.836) (B) (0.333, 0.047)" }, { "from": "gpt", "value": "(A) (0.680, 0.836)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4ad4364bb58839c8.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at left further to the viewer compared to green leafy tree at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is in front of green leafy tree at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8684e19fa17f8794.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if smooth asphalt road at center is wider than black plastic mirror at right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, smooth asphalt road at center is not wider than black plastic mirror at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aa357a97468a397f.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of wooden table at center more distant than that of wooden table at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3c520e92b31e5576.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the white matte shirt at center? (A) white cotton robe at center (B) light blue fabric at center" }, { "from": "gpt", "value": "(B) light blue fabric at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c2bb842a605c0ea.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.738, 0.620) (B) (0.848, 0.633) (C) (0.074, 0.511) (D) (0.469, 0.561)" }, { "from": "gpt", "value": "(C) (0.074, 0.511)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00dde8c962443880.jpg", "conversations": [ { "from": "human", "value": "\nDoes transparent glass skyscraper at center appear over dark green water at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, transparent glass skyscraper at center is positioned over dark green water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/25ca0082fb44d84a.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at upper center below green textured rock at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, green leafy tree at upper center is located below green textured rock at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4c564f8c8f9d4b83.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the silver metallic sedan at center? Choose among these: (A) black fabric shirt at right (B) black matte jacket at center" }, { "from": "gpt", "value": "(B) black matte jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5cfeea70cfa5a05a.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of black metal chair at left in relation to white fur cat at lower left? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d3ac431e46661564.jpg", "conversations": [ { "from": "human", "value": "\nIs green stone hedge at center to the right of green leafy tree at upper center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, green stone hedge at center is to the left of green leafy tree at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a70c09d124f04e0f.jpg", "conversations": [ { "from": "human", "value": "\nDoes printed fabric shirt at center appear on the left side of green fabric cap at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, printed fabric shirt at center is to the right of green fabric cap at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/62c83c9da22fe6cf.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the red glass tabasco bottle at center? Choose from: (A) translucent plastic tabasco bottle at center (B) yellow translucent bottle at center-right (C) shiny green plastic tube of candy at left (D) clear plastic bottle of vegetable oil at center" }, { "from": "gpt", "value": "(A) translucent plastic tabasco bottle at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3736207564cf6790.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.612, 0.923) (B) (0.802, 0.467)" }, { "from": "gpt", "value": "(B) (0.802, 0.467)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/11143feb22db2ff5.jpg", "conversations": [ { "from": "human", "value": "\nIs black-spotted fur dog at lower center smaller than spotted fur dog at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, black-spotted fur dog at lower center is smaller than spotted fur dog at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3e2ccebb5acd3f4e.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the white fabric man at center? (A) white wool coat at upper right (B) purple cotton t-shirt at lower center" }, { "from": "gpt", "value": "(A) white wool coat at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37165c140f2ed1d0.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.370, 0.997) (B) (0.125, 0.878)" }, { "from": "gpt", "value": "(A) (0.370, 0.997)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c15b568c4ba0fdcc.jpg", "conversations": [ { "from": "human", "value": "\nDoes yellow printed fabric at center lie in front of matte black head at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, yellow printed fabric at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e30373f4256463f2.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) green plastic power tool at center (B) green plastic tool at center (C) metallic silver shovel at lower right, is positioned closest to the silver metallic ladder at center?" }, { "from": "gpt", "value": "(B) green plastic tool at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/350c4c2fc48be4f5.jpg", "conversations": [ { "from": "human", "value": "\nIs white shirt at upper center smaller than blue cotton shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, white shirt at upper center occupies less space than blue cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04d2142ceeff1fd1.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) gray stone stairs at center (B) white leather sandal at lower left (C) black straw hat at center" }, { "from": "gpt", "value": "(C) black straw hat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/edd8ac48a7490773.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.572, 0.822) (B) (0.239, 0.559)" }, { "from": "gpt", "value": "(B) (0.239, 0.559)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/081e597c6617e715.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.959, 0.598) (B) (0.486, 0.220) (C) (0.186, 0.698) (D) (0.361, 0.609)" }, { "from": "gpt", "value": "(B) (0.486, 0.220)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c17ab94cb0047c6.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.191, 0.266) (B) (0.402, 0.866)" }, { "from": "gpt", "value": "(A) (0.191, 0.266)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5368286e925b0a26.jpg", "conversations": [ { "from": "human", "value": "\nIs black graffiti at center closer to the viewer compared to brushed metal jeep at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is behind brushed metal jeep at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/388f0d5b1094a720.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) shiny dark gray spire at center-left (B) golden yellow leaves at upper right (C) golden foliage at center (D) transparent glass water at center" }, { "from": "gpt", "value": "(D) transparent glass water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5b184a5876bf99de.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) orange fabric helmet at center (B) white striped shirt at upper center" }, { "from": "gpt", "value": "(A) orange fabric helmet at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/98f92e6d9b90e059.jpg", "conversations": [ { "from": "human", "value": "\nIs matte beige dress at center closer to the viewer compared to multicolored silk headscarf at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is in front of multicolored silk headscarf at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a0917b185146b06d.jpg", "conversations": [ { "from": "human", "value": "\nIs brown embroidered pillow at lower left bigger than orange fur tail at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, brown embroidered pillow at lower left is larger in size than orange fur tail at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5e1488d3f32b3525.jpg", "conversations": [ { "from": "human", "value": "\nIs dark wood table at center above dark brown hair at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, dark wood table at center is not positioned above dark brown hair at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/816c505820fafb9a.jpg", "conversations": [ { "from": "human", "value": "\nDoes black wetsuit surfer at center have a lesser width compared to dark gray sweater at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, black wetsuit surfer at center's width is not less than dark gray sweater at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e1fc0a5f183f69c0.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.746, 0.858) (B) (0.938, 0.708)" }, { "from": "gpt", "value": "(A) (0.746, 0.858)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e1552e0403d8aba5.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.049, 0.236) (B) (0.091, 0.606) (C) (0.297, 0.620) (D) (0.542, 0.312)" }, { "from": "gpt", "value": "(B) (0.091, 0.606)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3b6fe8eb40587140.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of matte black signboard at center and black satin suit at center in the image provided, where is matte black signboard at center located with respect to black satin suit at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/15944f4df377239a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.472, 0.445) (B) (0.536, 0.231) (C) (0.370, 0.002)" }, { "from": "gpt", "value": "(C) (0.370, 0.002)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/674e6e295c6e3d68.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at upper center to the right of green grass at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, green leafy tree at upper center is to the right of green grass at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/50cba6f1acbd4a36.jpg", "conversations": [ { "from": "human", "value": "\nIs black glass window at center behind gray stone crack at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/35ddd693e0a9af18.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white fabric dome at center is smaller than dark blue jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, white fabric dome at center might be larger than dark blue jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ef7da49ea8f94245.jpg", "conversations": [ { "from": "human", "value": "\nDoes pale skin at lower right appear on the left side of white fabric lounge chair at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, pale skin at lower right is to the left of white fabric lounge chair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a64f065622a3602d.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) gold metallic crown at upper center (B) dark gray sweatshirt at center" }, { "from": "gpt", "value": "(B) dark gray sweatshirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/007a8a03f37c7c11.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the light brown hair at center among (A) light blue t-shirt at center (B) white cotton crowd at center (C) dark blue polo shirt at center (D) white floral dress at center?" }, { "from": "gpt", "value": "(C) dark blue polo shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/31d44f2a7d2389ac.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black dress at center is thinner than black lace dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, matte black dress at center is thinner than black lace dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5f586bc72683a4f5.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) green reflective safety vest at upper right (B) green reflective vest at center (C) high-visibility fabric jacket at center" }, { "from": "gpt", "value": "(C) high-visibility fabric jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e5d75ea133ac843b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark blue van at center is wider than metallic silver sedan at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5af2caa0c328709.jpg", "conversations": [ { "from": "human", "value": "\nIs green striped shirt at center positioned behind black textured baseball cap at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0080460633eed194.jpg", "conversations": [ { "from": "human", "value": "\nIs blue cotton shirt at upper center wider than leather gun at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d3e5970ab91457d9.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown matte shirt at center is positioned above matte black sunglasses at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, brown matte shirt at center is located above matte black sunglasses at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4ca112316d155a1.jpg", "conversations": [ { "from": "human", "value": "\nDoes black dress at lower left appear over red fabric dress at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, black dress at lower left is above red fabric dress at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cbd75669fa34fd85.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray fabric shirt at center is bigger than silvery metallic fish at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bbe7c5ddf20feab0.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) white matte jacket at center (B) pink fabric baby at center (C) green matte shirt at left (D) wooden bench at center" }, { "from": "gpt", "value": "(B) pink fabric baby at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/19e40fe1522d4571.jpg", "conversations": [ { "from": "human", "value": "\nWhere is leather fringe vest at center located in relation to brown suede cape at center in the image? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/042272284cb6527a.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white marble rabbit at center is thinner than matte bark tree at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07865168290e64e5.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the green matte shirt at center? (A) purple floral dress at center (B) purple fabric doll at center (C) white cotton dress at left" }, { "from": "gpt", "value": "(A) purple floral dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/06b46c761d135453.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of green textured forest at upper center in relation to green matte tree at lower left? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2fb596587cadaf90.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) wooden table at lower left (B) metallic mesh table at lower left" }, { "from": "gpt", "value": "(A) wooden table at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9264ba92c28f7987.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy tree at upper center have a greater width compared to brown gravel pile at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, the width of green leafy tree at upper center exceeds that of brown gravel pile at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/81be91c4957d2f84.jpg", "conversations": [ { "from": "human", "value": "\nIs black leather jacket at center wider than red velvet coat at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, black leather jacket at center is not wider than red velvet coat at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e0669dfc3daa848.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of painted wood horse at center in relation to shiny white horse at left? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc0ab08cfd37864b.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if green leafy grass at center is positioned to the right of green needle-like leaves at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, green leafy grass at center is to the right of green needle-like leaves at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d6972a356dbea814.jpg", "conversations": [ { "from": "human", "value": "\nDoes green smooth water at center have a smaller size compared to gray rough rock at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, green smooth water at center might be larger than gray rough rock at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/161cdaa93fed7e28.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark blue shirt at center have a lesser width compared to red t-shirt at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, dark blue shirt at center might be wider than red t-shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c2a21598edd8799e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) matte green shirt at center (B) matte red scooter at center (C) red matte/metallic food truck at center" }, { "from": "gpt", "value": "(A) matte green shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c52896f6e8a407da.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) green leafy bush at upper left (B) metallic tripod at left" }, { "from": "gpt", "value": "(B) metallic tripod at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04d7411555c69bd7.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.839, 0.775) (B) (0.769, 0.264) (C) (0.528, 0.517)" }, { "from": "gpt", "value": "(C) (0.528, 0.517)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/292469b85ac9b396.jpg", "conversations": [ { "from": "human", "value": "\nDoes transparent glass window at center appear on the right side of green matte forest at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, transparent glass window at center is not to the right of green matte forest at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/89aa27db59ccf623.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the black matte bicycle at left? Select from: (A) silver metallic wheel at lower center (B) white striped shirt at lower right" }, { "from": "gpt", "value": "(B) white striped shirt at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b04423a7ec716b85.jpg", "conversations": [ { "from": "human", "value": "\nDoes dark glass bottle at lower right appear on the left side of dark red glass bottle at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, dark glass bottle at lower right is not on the left side of dark red glass bottle at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e68d3768da983d09.jpg", "conversations": [ { "from": "human", "value": "\nWhere is matte pink shirt at center located in relation to batik-patterned dress at center in the image? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95cd48abfc62d56a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.345, 0.828) (B) (0.277, 0.561)" }, { "from": "gpt", "value": "(A) (0.345, 0.828)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5364f40173674293.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green grass at center located in relation to blue fabric at right in the image? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9674cb891d2cd6f1.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.815, 0.775) (B) (0.251, 0.812)" }, { "from": "gpt", "value": "(A) (0.815, 0.775)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e721f39b564c8a73.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark brown hair at upper center is positioned below blue glossy eye at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, dark brown hair at upper center is below blue glossy eye at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0801d3439d07109b.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the knitted beige cardigan at center? Choose among these: (A) matte black scarf at center (B) brown leather jacket at left" }, { "from": "gpt", "value": "(B) brown leather jacket at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e823c79fce20944f.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) green fabric shirt at right (B) green cotton shirt at center (C) blue water at center" }, { "from": "gpt", "value": "(A) green fabric shirt at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f88b5c85c6152bd.jpg", "conversations": [ { "from": "human", "value": "\nIs blue woolen jacket at center bigger than white knitted sweater at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07f7e5b08dde52fc.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white matte jacket at center is positioned to the left of shiny metallic ski at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find white matte jacket at center to the left of shiny metallic ski at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4e1d5510bfe8a2e7.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) black leather jacket at center (B) leopard print dress at center (C) shiny brown electric guitar at center" }, { "from": "gpt", "value": "(B) leopard print dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0c8ce872a79e42b3.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) white glossy smartphone at center (B) orange wood pen at center" }, { "from": "gpt", "value": "(B) orange wood pen at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9379674a0494bf76.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray textured suit at center is wider than white striped tie at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of gray textured suit at center exceeds that of white striped tie at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1144a3de852a6b4a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.014, 0.389) (B) (0.540, 0.316)" }, { "from": "gpt", "value": "(B) (0.540, 0.316)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd516d25875c8fb9.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.967, 0.125) (B) (0.733, 0.386) (C) (0.169, 0.786)" }, { "from": "gpt", "value": "(A) (0.967, 0.125)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b459a1e87ee9450c.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) translucent pink exoskeleton at center (B) translucent pink shrimp at upper left" }, { "from": "gpt", "value": "(A) translucent pink exoskeleton at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a37b3345d27283d9.jpg", "conversations": [ { "from": "human", "value": "\nIs gray concrete path at center wider than matte black stroller at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/045733d92f906838.jpg", "conversations": [ { "from": "human", "value": "\nDoes white sequined shirt at center have a smaller size compared to white sequined top at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white sequined shirt at center is not smaller than white sequined top at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/455e02bfd1934eeb.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the blue metallic car at center? Select from: (A) asphalt road at center (B) blue glossy car at center" }, { "from": "gpt", "value": "(B) blue glossy car at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/52a585e0b4769df8.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at center to the left of stone arch bridge at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, green leafy tree at center is not on the left side of stone arch bridge at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04f9bdad5934e688.jpg", "conversations": [ { "from": "human", "value": "\nWhere is white paper book at center located in relation to clear plastic goggles at center in the image? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf8379de677b7911.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white matte ambulance at center is positioned below white plastic license plate at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, white matte ambulance at center is not positioned below white plastic license plate at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2df0373fbbc7bb3e.jpg", "conversations": [ { "from": "human", "value": "\nIs matte red shirt at center thinner than red plastic shovel at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2fe6d19942fb2c03.jpg", "conversations": [ { "from": "human", "value": "\nDoes smooth suit at upper right have a greater width compared to dark blue suit at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, smooth suit at upper right is wider than dark blue suit at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d89b8972e04f1084.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown leather swivel chair at left is positioned to the left of metallic silver bookshelf at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, brown leather swivel chair at left is to the right of metallic silver bookshelf at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/16d1d4b583b028c7.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the red fabric at lower right? Choose from: (A) shiny green costume at center (B) pink satin umbrella at center" }, { "from": "gpt", "value": "(A) shiny green costume at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/41715fa296522677.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) matte green t-shirt at center (B) white dotted shirt at upper right" }, { "from": "gpt", "value": "(B) white dotted shirt at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5469964829a0352c.jpg", "conversations": [ { "from": "human", "value": "\nDoes red/white striped flag at upper center appear under camouflage fabric uniform at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, red/white striped flag at upper center is above camouflage fabric uniform at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0c765f59623552b4.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green grass football field at center located in relation to white matte shirt at center in the image? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b2bf2314f2ae78f7.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned closest to the black fur dog at center? Select from: (A) orange shirt at left (B) blue cotton shirt at center" }, { "from": "gpt", "value": "(B) blue cotton shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f49a348449e16427.jpg", "conversations": [ { "from": "human", "value": "\nWhere is matte orange sweatshirt at center located in relation to golden brown crispy chicken at center in the image? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2ba3cc3a5003932d.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.035, 0.766) (B) (0.270, 0.362) (C) (0.170, 0.292)" }, { "from": "gpt", "value": "(A) (0.035, 0.766)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c2d1081932121a42.jpg", "conversations": [ { "from": "human", "value": "\nDoes green leafy palm tree at left have a smaller size compared to black glossy car at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8604b6a2a21b1a6d.jpg", "conversations": [ { "from": "human", "value": "\nIs matte green shirt at center positioned before smooth gray pole at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/606122b3fb399b72.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.616, 0.536) (B) (0.178, 0.730) (C) (0.922, 0.466)" }, { "from": "gpt", "value": "(C) (0.922, 0.466)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/807cdd1d5a5969d8.jpg", "conversations": [ { "from": "human", "value": "\nIs beige fabric canopy bed at center wider than wooden table at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, beige fabric canopy bed at center is wider than wooden table at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2119f94f34f70e88.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass at center in front of green leafy plant at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/61f24e72c764ef45.jpg", "conversations": [ { "from": "human", "value": "\nWhere is green leafy tree at left located in relation to green rough bark tree at right in the image? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea80d60181f33365.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) brown matte water at center (B) brown fabric bag at right (C) dark green fabric person at center (D) brown fabric person at center" }, { "from": "gpt", "value": "(C) dark green fabric person at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/797d4d5375744eee.jpg", "conversations": [ { "from": "human", "value": "\nDoes white fabric crowd at center appear over shiny orange jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, white fabric crowd at center is positioned over shiny orange jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/25b9515a85d121be.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.765, 0.844) (B) (0.372, 0.438)" }, { "from": "gpt", "value": "(A) (0.765, 0.844)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/391a9ff61af5540a.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.343, 0.478) (B) (0.463, 0.448) (C) (0.161, 0.864)" }, { "from": "gpt", "value": "(B) (0.463, 0.448)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00ca3d90f61229c1.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) wooden beam at center (B) white paper lantern at upper right" }, { "from": "gpt", "value": "(B) white paper lantern at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ffbca833f482698e.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.759, 0.750) (B) (0.485, 0.556) (C) (0.622, 0.752) (D) (0.198, 0.505)" }, { "from": "gpt", "value": "(A) (0.759, 0.750)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/000b72e1446f8849.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown leather couch at center appear over matte red blazer at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0eae6cb4dd8d4e26.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.634, 0.573) (B) (0.805, 0.202) (C) (0.484, 0.561) (D) (0.186, 0.619)" }, { "from": "gpt", "value": "(D) (0.186, 0.619)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6581c5a94bb94b0c.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte black guitar at center is positioned to the left of black leather jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, matte black guitar at center is not to the left of black leather jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34ddf8765b9ebd78.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if red striped shirt at left is thinner than white satin blouse at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, red striped shirt at left's width is less than white satin blouse at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4038afcc2eb1f0d9.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) black fabric dress at center (B) printed fabric dress at center (C) dark blue shirt at center" }, { "from": "gpt", "value": "(B) printed fabric dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77150990bd32890c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) black shirt at left (B) light blue shirt at right" }, { "from": "gpt", "value": "(A) black shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e162060deb27b67.jpg", "conversations": [ { "from": "human", "value": "\nDoes white snow-covered tree at center appear over snow-covered evergreen at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, white snow-covered tree at center is below snow-covered evergreen at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c917252f38994e75.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow matte airplane at center behind shiny metallic airplane at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, yellow matte airplane at center is further from the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1897a2cd46e9127.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the white matte volleyball at upper center? Choose among these: (A) blue matte volleyball player at center (B) white mesh net at center (C) black synthetic volleyball at center" }, { "from": "gpt", "value": "(B) white mesh net at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37bd3d16f8a213f6.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) blue fabric canopy at upper center (B) black matte jacket at center (C) metallic silver foil at right (D) red matte jacket at lower left" }, { "from": "gpt", "value": "(A) blue fabric canopy at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ae1a6a6465d6738d.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the green grass at center from the following options: (A) pink jersey at left (B) black matte shirt at center?" }, { "from": "gpt", "value": "(A) pink jersey at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e70dfeef38c9baa7.jpg", "conversations": [ { "from": "human", "value": "\nDoes granite pillar at center appear under green leafy tree at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, granite pillar at center is positioned under green leafy tree at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f1782670062c97be.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) matte black jacket at center (B) orange cotton t-shirt at center" }, { "from": "gpt", "value": "(B) orange cotton t-shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d4d5f7d499889757.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if bare branches at upper center is positioned to the right of green leafy tree at upper left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, bare branches at upper center is to the right of green leafy tree at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e16f830cffe19cbf.jpg", "conversations": [ { "from": "human", "value": "\nDoes teal denim jacket at left appear under matte black blazer at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/12be405cf289e336.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.101, 0.792) (B) (0.274, 0.312)" }, { "from": "gpt", "value": "(A) (0.101, 0.792)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/921d5e44e89a072d.jpg", "conversations": [ { "from": "human", "value": "\nDoes red painted metal sign at upper center appear over matte black shirt at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, red painted metal sign at upper center is above matte black shirt at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7d96320de43753ed.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) black puffy coat at center (B) dark brown fur at center" }, { "from": "gpt", "value": "(A) black puffy coat at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3099486d77359608.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.472, 0.266) (B) (0.737, 0.414)" }, { "from": "gpt", "value": "(B) (0.737, 0.414)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/caf4f64aec2dabd8.jpg", "conversations": [ { "from": "human", "value": "\nIs multicolored costume at center bigger than pink fabric dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/262c2189dbedd291.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow matte jersey at center to the right of light blue fabric shorts at center from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, yellow matte jersey at center is not to the right of light blue fabric shorts at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aed2a0bdcf9b2f7a.jpg", "conversations": [ { "from": "human", "value": "\nDoes light gray fabric shirt at right come behind gray wool suit at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e1fce4941bdab1f7.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of striped shirt at center in relation to green fabric jacket at center? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3ba17f084b61206c.jpg", "conversations": [ { "from": "human", "value": "\nIs yellow smooth banana at upper center wider than yellowish matte bread at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, yellow smooth banana at upper center might be narrower than yellowish matte bread at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9e58967e0bbbc48.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass at center below matte pink dress at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8bea9a6ce68ae24f.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black binoculars at center appear on the right side of black rubber binoculars at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, matte black binoculars at center is not to the right of black rubber binoculars at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/911134b6c4f05371.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) yellow plastic paddle at left (B) yellow plastic paddle at right (C) blue/textured life jacket at center (D) blue painted wood boat at center" }, { "from": "gpt", "value": "(B) yellow plastic paddle at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04527674f720be5d.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) dark brown leather jacket at center (B) wooden rail at center" }, { "from": "gpt", "value": "(A) dark brown leather jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/94c0642afec2cc2c.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of green glass traffic light at upper center and matte black car at center in the image provided, where is green glass traffic light at upper center located with respect to matte black car at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/69bc23b1ca85f728.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is yellow matte skateboard at center located relative to white glossy car at lower left? (A) right (B) left" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/14650013756dc7e7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if concrete at lower right is positioned below black matte motorcycle at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, concrete at lower right is not below black matte motorcycle at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/722718b986f2f568.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.272, 0.547) (B) (0.655, 0.391)" }, { "from": "gpt", "value": "(B) (0.655, 0.391)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7c9b54c1b56fa414.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is green leafy tree at center located relative to green leafy tree at upper left? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c60a868565d0a6b5.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) smooth gray mountain at center (B) bright white orb at upper left" }, { "from": "gpt", "value": "(A) smooth gray mountain at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7ca4b90c5c53d78e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.989, 0.631) (B) (0.301, 0.444)" }, { "from": "gpt", "value": "(B) (0.301, 0.444)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf0b12e10b276af7.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown fabric headscarf at lower left have a larger size compared to rainbow fabric umbrella at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, brown fabric headscarf at lower left is not larger than rainbow fabric umbrella at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9fa4e87cd7a252cd.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the glossy red pillar at center-left? Choose among these: (A) shiny red pillar at center (B) matte red pillar at center" }, { "from": "gpt", "value": "(A) shiny red pillar at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/52825a1c126e699e.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) pale skin at center (B) gray concrete stone at center (C) green matte seedling at center" }, { "from": "gpt", "value": "(C) green matte seedling at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e39915cc4005b21.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears closest to the camera in this image? (A) white plastic ship at center (B) polished metal statue at center" }, { "from": "gpt", "value": "(A) white plastic ship at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a0510ca49de2579a.jpg", "conversations": [ { "from": "human", "value": "\nIs brown glossy horse at center bigger than blue cotton shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, brown glossy horse at center is not larger than blue cotton shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c826772253aebe55.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of matte brown shirt at center in relation to matte skin nose at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c053ab4d884cb53.jpg", "conversations": [ { "from": "human", "value": "\nDoes red cotton shirt at lower left appear on the left side of plaid fabric shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, you'll find red cotton shirt at lower left to the left of plaid fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f425300c2f0bca04.jpg", "conversations": [ { "from": "human", "value": "\nDoes white striped polo shirt at center appear under blue jersey at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/972dc188537470e5.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) matte black lamp post at center (B) wooden bench at center (C) black matte pole at right" }, { "from": "gpt", "value": "(A) matte black lamp post at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7fb811c83c3b5cb0.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) white glossy window at upper center (B) transparent glass airplane window at center" }, { "from": "gpt", "value": "(B) transparent glass airplane window at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a96091dd9f246783.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of white marble statue at center in reference to white marble mask at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/035e39ffbc6ee986.jpg", "conversations": [ { "from": "human", "value": "\nIs white marble bust at center below white stone inscription at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Actually, white marble bust at center is above white stone inscription at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/27f5238186917d06.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) brown muddy water at lower left (B) polished wood steamboat at left" }, { "from": "gpt", "value": "(A) brown muddy water at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0bbeb21353306d13.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the velvety red dress at center? Choose from: (A) fuzzy brown teddy bear at center (B) fuzzy brown teddy bear at left (C) fuzzy brown teddy bear at right" }, { "from": "gpt", "value": "(B) fuzzy brown teddy bear at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/86c3e70f028c2854.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at center behind brown metal/wooden bleacher at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, green leafy tree at center is further from the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d93b07bf89b852dd.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of concrete building at center and rustic wooden wagon at center in the image provided, where is concrete building at center located with respect to rustic wooden wagon at center? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/db58aa1c522e1382.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of matte red hoodie at left more distant than that of green matte jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, matte red hoodie at left is in front of green matte jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea859143b0c6949f.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.164, 0.355) (B) (0.085, 0.298)" }, { "from": "gpt", "value": "(A) (0.164, 0.355)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/037596c8adbb52db.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if red paper bag at center is positioned below matte plastic canister at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, red paper bag at center is not below matte plastic canister at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a87d9201e862bd0d.jpg", "conversations": [ { "from": "human", "value": "\nDoes green patina sculpture at center have a smaller size compared to green grassy field at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/01ffe5a57ccff9c6.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is floral fabric book at center located relative to white fabric doll at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/48023da6d29043b8.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.829, 0.650) (B) (0.545, 0.336)" }, { "from": "gpt", "value": "(A) (0.829, 0.650)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb6e0e7558323f40.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) black leather jacket at center (B) wooden frame shop window at center (C) matte black awning at upper center" }, { "from": "gpt", "value": "(A) black leather jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f3802c478919e25.jpg", "conversations": [ { "from": "human", "value": "\nDoes wooden table at center appear under matte gray monitor at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/84cbd8f4fe25982e.jpg", "conversations": [ { "from": "human", "value": "\nIs matte blue goggles at center thinner than blue matte goggles at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, matte blue goggles at center might be wider than blue matte goggles at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00aef3e49d49ee2b.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) green leafy bush at upper left (B) green grass at center, is positioned farthest from the white fluffy bush at upper right?" }, { "from": "gpt", "value": "(A) green leafy bush at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/179bf19f93958118.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the granite gravestone at right among (A) gray stone gravestone at center (B) rusty metal cross at center (C) speckled stone gravestone at center (D) green grassy at lower center?" }, { "from": "gpt", "value": "(A) gray stone gravestone at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/adbe93bb45673c03.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) white plastic microphone at upper center (B) matte black vest at left (C) smooth bald head at lower left" }, { "from": "gpt", "value": "(C) smooth bald head at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2d9df587ecb3fce6.jpg", "conversations": [ { "from": "human", "value": "\nDoes white weathered wood fence at center have a lesser width compared to green leafy tree at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, white weathered wood fence at center is thinner than green leafy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d1f96213a5ed599.jpg", "conversations": [ { "from": "human", "value": "\nDoes transparent plastic shower curtain at center appear under brownhair at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, transparent plastic shower curtain at center is not positioned below brownhair at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c549ac84100873f4.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.348, 0.681) (B) (0.354, 0.148) (C) (0.307, 0.650)" }, { "from": "gpt", "value": "(C) (0.307, 0.650)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/30f8bd5e6d99760e.jpg", "conversations": [ { "from": "human", "value": "\nIs golden ornate palace at center below wooden boat at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, golden ornate palace at center is not below wooden boat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eee4d9eed0e89ead.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.734, 0.542) (B) (0.563, 0.652)" }, { "from": "gpt", "value": "(B) (0.563, 0.652)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/78c5c60ab3f86161.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.740, 0.248) (B) (0.223, 0.681)" }, { "from": "gpt", "value": "(A) (0.740, 0.248)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c419378f7ecd5d60.jpg", "conversations": [ { "from": "human", "value": "\nIs green wool coat at right further to the viewer compared to clear glass wine glass at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7a7b54524212b42.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte blue paddle at center is positioned above red nylon life jacket at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3663349b94840d38.jpg", "conversations": [ { "from": "human", "value": "\nDoes green grassy field at lower center have a smaller size compared to yellow leafy tree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, green grassy field at lower center might be larger than yellow leafy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2e8bcd51c605047a.jpg", "conversations": [ { "from": "human", "value": "\nIs gold metallic rally car at center thinner than white casual clothing at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, gold metallic rally car at center's width is less than white casual clothing at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7d0ebf08a9a344cc.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) satin black suit at center (B) satin dress at center" }, { "from": "gpt", "value": "(B) satin dress at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4a6fb33848626c92.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white plastic boat at lower center is positioned above white plastic boat at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white plastic boat at lower center is not above white plastic boat at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5afd4a0159d98e1b.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) shiny black car at center (B) yellow/yellowish paper at upper right" }, { "from": "gpt", "value": "(A) shiny black car at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a2c36c4ebe7530b4.jpg", "conversations": [ { "from": "human", "value": "\nIs denim jeans at center below matte blue shirt at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3bf0bc31e4cca408.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.618, 0.473) (B) (0.237, 0.428)" }, { "from": "gpt", "value": "(A) (0.618, 0.473)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c48776390865edef.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte shirt at center closer to the viewer compared to smooth black hair at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9c7abec2ee949f42.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the matte black camera at left? (A) matte black blazer at center (B) white striped shirt at center" }, { "from": "gpt", "value": "(A) matte black blazer at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6f59d5b9251f4e75.jpg", "conversations": [ { "from": "human", "value": "\nDoes green grass field at center appear under white mesh net at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/be9b8c0fa3a7a170.jpg", "conversations": [ { "from": "human", "value": "\nIs asphalt road at lower left wider than silver metallic van at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e51c7c58f8b26e7b.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue fabric shirt at right appear over white plastic drone at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/09acf266aa4d15ea.jpg", "conversations": [ { "from": "human", "value": "\nIs white stone mask at left to the right of matte stone face at upper left from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, white stone mask at left is to the right of matte stone face at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c6ee5178f18c6887.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) white cotton shirt at lower left (B) clear water at center" }, { "from": "gpt", "value": "(B) clear water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0aef1cbaacfa77dd.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.306, 0.647) (B) (0.967, 0.863) (C) (0.131, 0.098) (D) (0.715, 0.825)" }, { "from": "gpt", "value": "(B) (0.967, 0.863)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/96bf701f4722df1f.jpg", "conversations": [ { "from": "human", "value": "\nIs black textured jacket at center further to camera compared to white fabric flag at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c785289ccf75ba28.jpg", "conversations": [ { "from": "human", "value": "\nDoes yellowish paper book at center appear on the left side of black fabric at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, yellowish paper book at center is to the left of black fabric at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f8bb6ca23aa2d9d1.jpg", "conversations": [ { "from": "human", "value": "\nDoes striped cotton shirt at center lie in front of black plastic goggles at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a3f2eabd67963cb3.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.530, 0.556) (B) (0.907, 0.161)" }, { "from": "gpt", "value": "(B) (0.907, 0.161)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5c10c8060672d84.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the metallic gold entertainment center at center from the following options: (A) brown textured column at left (B) brown polished column at center (C) white glossy washing machine at center (D) white matte cabinet at right?" }, { "from": "gpt", "value": "(D) white matte cabinet at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/841d0bf480c49d01.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) white matte shirt at center (B) black matte tank top at center (C) translucent glass at lower center" }, { "from": "gpt", "value": "(A) white matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c53c0c27b5309464.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.532, 0.295) (B) (0.157, 0.545) (C) (0.749, 0.245) (D) (0.128, 0.969)" }, { "from": "gpt", "value": "(B) (0.157, 0.545)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/634f6528ec8af3b6.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black jacket at center closer to the viewer compared to gray matte hair at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9850e5905e2ab9bf.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of clear plastic glasses at left in reference to smooth skin nose at center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cd8efe43cb55b177.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if dark blue shorts at right is positioned below white cotton shirt at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, dark blue shorts at right is positioned under white cotton shirt at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f48f7bacbb59c029.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the pink plastic phone at center from the following options: (A) beige leather chair at lower left (B) metallic silver chair at lower right?" }, { "from": "gpt", "value": "(B) metallic silver chair at lower right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/80bcf087b989aacc.jpg", "conversations": [ { "from": "human", "value": "\nIs striped cotton shirt at center closer to camera compared to striped shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/869af7f272bd02ed.jpg", "conversations": [ { "from": "human", "value": "\nDoes pink plastic chair at center appear over matte orange plush rabbit at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb297e06bda79bd4.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.642, 0.952) (B) (0.206, 0.978)" }, { "from": "gpt", "value": "(A) (0.642, 0.952)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8024be7747d42c95.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the brown woolen jacket at center? (A) dark gray sweater at center (B) black suit at center" }, { "from": "gpt", "value": "(A) dark gray sweater at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4430dd316bacdd00.jpg", "conversations": [ { "from": "human", "value": "\nDoes black fur dog at center appear under white fur with brown spots at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, black fur dog at center is not positioned below white fur with brown spots at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7659a1d73db3a9d3.jpg", "conversations": [ { "from": "human", "value": "\nObserving the image, what is the correct spatial positioning of dark blue dotted fabric tie at center in reference to matte black hand at upper center? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0855e98dee0c73ac.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray suit at center is positioned to the right of wooden picture frame at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find gray suit at center to the right of wooden picture frame at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f45456b78ccb0edc.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.977, 0.494) (B) (0.406, 0.727) (C) (0.311, 0.941)" }, { "from": "gpt", "value": "(B) (0.406, 0.727)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e90d82f8cdf90f91.jpg", "conversations": [ { "from": "human", "value": "\nIs black leather jacket at lower right bigger than black leather earring at ear? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, black leather jacket at lower right is larger in size than black leather earring at ear." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fdc1d6955edcf987.jpg", "conversations": [ { "from": "human", "value": "\nIs green grass at lower left to the left of green leafy tree at left from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, green grass at lower left is not to the left of green leafy tree at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ad6d34259c52a2dd.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the white soft shirt at lower center? (A) dark blue fleece jacket at center (B) dark brown leather jacket at lower center (C) pink fabric dress at center" }, { "from": "gpt", "value": "(A) dark blue fleece jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e164311c62c0fc81.jpg", "conversations": [ { "from": "human", "value": "\nDoes pink fabric shirt at upper left have a larger size compared to pink fabric at upper left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, pink fabric shirt at upper left has a larger size compared to pink fabric at upper left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3048d13c448ceefd.jpg", "conversations": [ { "from": "human", "value": "\nIs brown cardboard boxes at lower left to the right of orange matte jacket at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, brown cardboard boxes at lower left is not on the right side of orange matte jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1c91f23dde2ad716.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is positioned farthest from the pink hair at right? Select from: (A) graysoftbeard at center (B) white matte shirt at center" }, { "from": "gpt", "value": "(A) graysoftbeard at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/820f5aeef9ba8d5f.jpg", "conversations": [ { "from": "human", "value": "\nIs white cotton t-shirt at center to the left of light blue jeans at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, white cotton t-shirt at center is not to the left of light blue jeans at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9915cd74526cd47.jpg", "conversations": [ { "from": "human", "value": "\nIs matte blue jersey at center bigger than blue quilted jacket at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, matte blue jersey at center is not larger than blue quilted jacket at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/46e2ab231df66458.jpg", "conversations": [ { "from": "human", "value": "\nIs greenish-blue water at center wider than bamboo placemat at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, greenish-blue water at center is wider than bamboo placemat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/eb4aee5704c6a5ec.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.012, 0.656) (B) (0.902, 0.252)" }, { "from": "gpt", "value": "(A) (0.012, 0.656)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6267ef32e21d0e7f.jpg", "conversations": [ { "from": "human", "value": "\nDoes brown muddy water at center have a greater width compared to rustic rock canyon at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7fe4189598486848.jpg", "conversations": [ { "from": "human", "value": "\nDoes green smooth water at center have a lesser width compared to green leafy tree at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, green smooth water at center's width is not less than green leafy tree at lower center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a70c2ffc054566e8.jpg", "conversations": [ { "from": "human", "value": "\nIs glossy blue motorcycle at left bigger than denim shorts at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, glossy blue motorcycle at left has a larger size compared to denim shorts at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6a3614666ffbc4eb.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of blue fabric backpack at center in relation to black and white striped pants at lower right? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a4095e4e7d1a4f10.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.811, 0.606) (B) (0.144, 0.400) (C) (0.293, 0.547) (D) (0.949, 0.994)" }, { "from": "gpt", "value": "(B) (0.144, 0.400)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c1c750c03d689b68.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the brushed metal pavement at center among (A) blue matte helmet at upper center (B) blue matte helmet at upper left (C) white matte bicycle at center (D) yellow matte shirt at center?" }, { "from": "gpt", "value": "(D) yellow matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d5e596fc55929c5e.jpg", "conversations": [ { "from": "human", "value": "\nDoes white foamy wave at lower center lie in front of orange rubber ring at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/64b3ee49358d9a74.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) dark gray fabric umbrella at center (B) beige stone railing at center (C) brown stone statue at upper right (D) matte gray guitar at center" }, { "from": "gpt", "value": "(D) matte gray guitar at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ed75f05058af0305.jpg", "conversations": [ { "from": "human", "value": "\nIs dark gray metallic car at lower right further to the viewer compared to rubberized red car at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d506f6977ebc9768.jpg", "conversations": [ { "from": "human", "value": "\nWhere is metallic gray concrete finisher at center located in relation to maroon fabric shirt at upper left in the image? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c017672da9277c1d.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if blue water at center is wider than teal matte boat at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dc8869c6cf46b78f.jpg", "conversations": [ { "from": "human", "value": "\nDoes bare branches at center appear over brown leafless branches at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, bare branches at center is located above brown leafless branches at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b81a9a80f3132373.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of green matte t-shirt at center and white matte boats at left in the image provided, where is green matte t-shirt at center located with respect to white matte boats at left? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bf37bb25a3c5a30b.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.217, 0.558) (B) (0.737, 0.605)" }, { "from": "gpt", "value": "(B) (0.737, 0.605)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/721eb0e8a56de8a5.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) green fabric flagpole at upper center (B) dark stone castle at upper center (C) green fabric flag at upper center" }, { "from": "gpt", "value": "(B) dark stone castle at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb704d012f94fc13.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden pergola at center behind wooden at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, wooden pergola at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e7dfe06fd065cd4.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) matte plastic goggles at center (B) beige cotton shirt at center (C) blue silk saree at center, is positioned farthest from the green leafy water at left?" }, { "from": "gpt", "value": "(A) matte plastic goggles at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/462429369fe066e0.jpg", "conversations": [ { "from": "human", "value": "\nIs black metal pole at upper center to the right of white marble sculpture at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, black metal pole at upper center is not to the right of white marble sculpture at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/89acc01a5af97de6.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.712, 0.530) (B) (0.762, 0.316) (C) (0.618, 0.619) (D) (0.408, 0.361)" }, { "from": "gpt", "value": "(B) (0.762, 0.316)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/79cb477c8385b7a7.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.562, 0.633) (B) (0.358, 0.536)" }, { "from": "gpt", "value": "(A) (0.562, 0.633)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c590a7d5be4024e7.jpg", "conversations": [ { "from": "human", "value": "\nIs gray textured suit at right to the right of blue striped shirt at right from the viewer's perspective? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, gray textured suit at right is not to the right of blue striped shirt at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ec02ab281e383909.jpg", "conversations": [ { "from": "human", "value": "\nIs black fluffy dog at center wider than shiny black hair at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, black fluffy dog at center is wider than shiny black hair at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d061d6049204df58.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte sculpture at center appear on the left side of gray concrete pavement at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, white matte sculpture at center is not to the left of gray concrete pavement at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/77bb86dc50f8c3c6.jpg", "conversations": [ { "from": "human", "value": "\nDoes light blue shirt at center appear over white fabric table at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, light blue shirt at center is above white fabric table at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fb6abb3eab44166a.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of green grassy trail at center in relation to green matte tree at left? (A) above (B) below" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0601e5f4bace40c0.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.653, 0.181) (B) (0.025, 0.705) (C) (0.030, 0.025) (D) (0.890, 0.778)" }, { "from": "gpt", "value": "(A) (0.653, 0.181)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/077e7164ba6098ad.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte shirt at center appear on the right side of fuzzy brown squirrel at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white matte shirt at center is not on the right side of fuzzy brown squirrel at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c22042814f4e5a40.jpg", "conversations": [ { "from": "human", "value": "\nDoes clear water at lower center have a greater width compared to white glossy boat at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of clear water at lower center exceeds that of white glossy boat at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e0f4e20695d7375a.jpg", "conversations": [ { "from": "human", "value": "\nIs asphalt road at center below green grassy field at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a422b053f8e16487.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.982, 0.059) (B) (0.322, 0.425) (C) (0.794, 0.961)" }, { "from": "gpt", "value": "(A) (0.982, 0.059)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b99d013bcac5419f.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if black matte jacket at center is wider than dark blue jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, black matte jacket at center is not wider than dark blue jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/404d176c3d602b90.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if shiny orange goldfish at center is bigger than glossy orange fish at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, shiny orange goldfish at center might be smaller than glossy orange fish at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/68bf05a17091a4bc.jpg", "conversations": [ { "from": "human", "value": "\nDoes green metal fence at center have a greater width compared to black plastic video camera at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, the width of green metal fence at center exceeds that of black plastic video camera at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b8dc7957b219bc64.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) pink fleece jacket at center (B) green paperboard poster at left" }, { "from": "gpt", "value": "(A) pink fleece jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7bbb0c02f2cc30f1.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.530, 0.342) (B) (0.909, 0.092)" }, { "from": "gpt", "value": "(A) (0.530, 0.342)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0208853ef61f5d0c.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) striped fabric dress at center (B) translucent glass beverage at center (C) purple striped shirt at center (D) black satin suit at right" }, { "from": "gpt", "value": "(B) translucent glass beverage at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7a24f1e4b7e70a25.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) beige stucco tower at center (B) shiny blue glass skyscraper at center (C) dark blue glass skyscraper at right (D) clear glass tower at upper center" }, { "from": "gpt", "value": "(A) beige stucco tower at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ecbf0a6d2b6be9b9.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if suede brown jacket at center is positioned to the left of denim jeans at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, suede brown jacket at center is to the right of denim jeans at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/607e7ebdfaa29de8.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.113, 0.494) (B) (0.958, 0.362) (C) (0.812, 0.641)" }, { "from": "gpt", "value": "(C) (0.812, 0.641)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e531ecb294ed9efe.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the smooth stone pole at center from the following options: (A) metallic pole at center (B) green patina statue at lower left (C) metallic pole at left?" }, { "from": "gpt", "value": "(A) metallic pole at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/35870b66815d2c8c.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.860, 0.200) (B) (0.424, 0.662)" }, { "from": "gpt", "value": "(B) (0.424, 0.662)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e21feda0457b7945.jpg", "conversations": [ { "from": "human", "value": "\nDoes clear blue water at lower center come behind dark blue fabric crowd at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bd0ae8855c605d48.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.272, 0.812) (B) (0.402, 0.764) (C) (0.152, 0.816)" }, { "from": "gpt", "value": "(B) (0.402, 0.764)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8e05dd8cd22bc24c.jpg", "conversations": [ { "from": "human", "value": "\nDoes silver metallic laptop at lower right have a smaller size compared to brown curly fur dog at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, silver metallic laptop at lower right is not smaller in size than brown curly fur dog at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8b6e12bac7a52a0c.jpg", "conversations": [ { "from": "human", "value": "\nIs concrete tarmac at center wider than transparent water at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, concrete tarmac at center is not wider than transparent water at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d545f1695aa75141.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) black matte camera at right (B) matte black suit at center (C) matte gray suit at left (D) dark gray fabric chair at center" }, { "from": "gpt", "value": "(D) dark gray fabric chair at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dd3fa7a12d72507b.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the light brown smooth dog at center? (A) brown fur dog at center (B) black glossy teeth at center (C) brown dirt track at lower center" }, { "from": "gpt", "value": "(C) brown dirt track at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1890ab461a2a5a86.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.777, 0.431) (B) (0.537, 0.487)" }, { "from": "gpt", "value": "(A) (0.777, 0.431)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca400852ab673846.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.461, 0.628) (B) (0.723, 0.908)" }, { "from": "gpt", "value": "(A) (0.461, 0.628)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c79d0fd7b47db6cf.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if gray concrete sidewalk at lower right is positioned to the right of matte red tower at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, gray concrete sidewalk at lower right is to the left of matte red tower at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/83382ae4710a04c4.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) dark green textured pine tree at upper left (B) dark green textured pine tree at left" }, { "from": "gpt", "value": "(A) dark green textured pine tree at upper left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/caf2a691ea39874a.jpg", "conversations": [ { "from": "human", "value": "\nIs black plastic ruler at upper right thinner than blue plastic needle at right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, black plastic ruler at upper right might be wider than blue plastic needle at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29b97de53cc8e732.jpg", "conversations": [ { "from": "human", "value": "\nDoes clear water at river right appear on the left side of camouflage fabric uniform at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, clear water at river right is not to the left of camouflage fabric uniform at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8c2620b731936295.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) blue tile swimming pool at center (B) skinny man at center" }, { "from": "gpt", "value": "(A) blue tile swimming pool at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9ca69b01c68de28e.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) blue striped shirt at left (B) white cotton polo shirt at center, is positioned farthest from the white glossy car at right?" }, { "from": "gpt", "value": "(A) blue striped shirt at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7612f1b41b624f60.jpg", "conversations": [ { "from": "human", "value": "\nIs camouflage shorts at left positioned in front of white foam board at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/23dda368fe4013de.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is dark brown wrought iron at center located relative to rusty metal clock at center? (A) right (B) left" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/43e29d101724ba2d.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the white stone bell tower at upper left? (A) brown feathered bird at upper center (B) white stone tower at upper right" }, { "from": "gpt", "value": "(A) brown feathered bird at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e4b7cf2a36c545b2.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny silver car at lower left below white glossy car at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/60c408ef0ea374d3.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) striped sweater at right (B) dark gray textured shirt at center (C) checkered fabric shirt at right" }, { "from": "gpt", "value": "(A) striped sweater at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d9ed882069fefb83.jpg", "conversations": [ { "from": "human", "value": "\nDoes yellow reflective vest at center have a larger size compared to smooth leather jacket at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, yellow reflective vest at center is not bigger than smooth leather jacket at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de336471f2b14414.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white cotton baby at center is wider than translucent plastic bottle at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, white cotton baby at center is wider than translucent plastic bottle at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b43fb8054b39e35d.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the light blue button-down shirt at left? (A) blue cotton shirt at center (B) gray matte shirt at upper right" }, { "from": "gpt", "value": "(B) gray matte shirt at upper right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/905d5fe809602771.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.547, 0.928) (B) (0.508, 0.445)" }, { "from": "gpt", "value": "(B) (0.508, 0.445)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bdb12391864480d4.jpg", "conversations": [ { "from": "human", "value": "\nIs dark gray stone temple at center bigger than green leafy tree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, dark gray stone temple at center is larger in size than green leafy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/02e810ec6c47c0d4.jpg", "conversations": [ { "from": "human", "value": "\nDoes metallic blue train at center have a smaller size compared to metal/smooth train tracks at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, metallic blue train at center is not smaller than metal/smooth train tracks at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0d6312138c7e42fe.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown glass bottle at left is wider than metallic silver suv at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, brown glass bottle at left might be narrower than metallic silver suv at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c5c983bed600451b.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.240, 0.878) (B) (0.755, 0.773)" }, { "from": "gpt", "value": "(B) (0.755, 0.773)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1345db06f1f400f0.jpg", "conversations": [ { "from": "human", "value": "\nIs blue and white striped jersey at center smaller than white matte goal at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, blue and white striped jersey at center has a smaller size compared to white matte goal at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/baec54a4a3f8c5cd.jpg", "conversations": [ { "from": "human", "value": "\nIs white cotton shirt at center bigger than matte black dress at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white cotton shirt at center is not bigger than matte black dress at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1be6fe4d0a765082.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) wooden table at lower center (B) light brown shirt at center (C) white cotton jacket at right" }, { "from": "gpt", "value": "(B) light brown shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/88163fd39d486078.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) green matte tree at upper center (B) green textured tree at upper center (C) clear sand at bottom (D) clear water at center" }, { "from": "gpt", "value": "(A) green matte tree at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/058cb40e1d5cd201.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) clear water at center (B) white cotton shirt at upper center" }, { "from": "gpt", "value": "(A) clear water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/deac707e7a770b58.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of yellow matte shirt at right in relation to orange cotton pants at left? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/309ec59809d379d8.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is farther from the matte blue shirt at center among (A) black matte shirt at center (B) matte red shirt at center?" }, { "from": "gpt", "value": "(A) black matte shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29e807865b8acd60.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is nearest to the camera? (A) (0.421, 0.598) (B) (0.317, 0.533)" }, { "from": "gpt", "value": "(B) (0.317, 0.533)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/36768919b6a87787.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black jacket at center have a greater width compared to wooden at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, matte black jacket at center is wider than wooden at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2393b3aaaa407465.jpg", "conversations": [ { "from": "human", "value": "\nDoes white stone floor at center have a smaller size compared to light beige stone column at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Incorrect, white stone floor at center is not smaller in size than light beige stone column at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/780b4423c0ea3faf.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the black fur dog at lower left from the following options: (A) weathered wood at center (B) blue fabric shoe at lower left?" }, { "from": "gpt", "value": "(B) blue fabric shoe at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/79cbee9cff263294.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is farther from the green stone wall at right? Choose from: (A) yellow matte shirt at center (B) black matte visor at upper center" }, { "from": "gpt", "value": "(B) black matte visor at upper center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5fae5c9d18787867.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.147, 0.655) (B) (0.751, 0.578) (C) (0.544, 0.367)" }, { "from": "gpt", "value": "(B) (0.751, 0.578)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/14affbe0c7b95adf.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) transparent glass window at upper left (B) green felt pool table at center, is positioned farthest from the white matte stool at lower left?" }, { "from": "gpt", "value": "(B) green felt pool table at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2fe607a42f3fb590.jpg", "conversations": [ { "from": "human", "value": "\nDoes red matte shirt at center come behind green fabric shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/fcf93248ce5934c2.jpg", "conversations": [ { "from": "human", "value": "\nIs brown brick castle at center further to the viewer compared to green grassy bank at lower left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2deb9a042caffc4c.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.407, 0.584) (B) (0.050, 0.980)" }, { "from": "gpt", "value": "(A) (0.407, 0.584)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9684fc73a4155771.jpg", "conversations": [ { "from": "human", "value": "\nIs matte white screen at upper center bigger than matte black screen at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, matte white screen at upper center is larger in size than matte black screen at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ba266fb9c4061847.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte beige sweater at upper right appear on the right side of dark brown leather jacket at upper right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, matte beige sweater at upper right is to the left of dark brown leather jacket at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/71bf6d012638db2c.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the silhouette leafy tree at center? (A) black silhouette palm tree at center (B) silky black palm tree at upper left" }, { "from": "gpt", "value": "(A) black silhouette palm tree at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/71f4c9bea7db5e64.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue sequined dress at center lie in front of light blue sweatshirt at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/20c25a2ef0245d1b.jpg", "conversations": [ { "from": "human", "value": "\nIs dark brown fabric saree at lower center above dark printed fabric at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2f33a49b6828ed71.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.387, 0.328) (B) (0.375, 0.787)" }, { "from": "gpt", "value": "(A) (0.387, 0.328)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f5ebc4f4b1e11770.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) translucent yellow ant at center (B) yellow matte ant at center-right (C) orange matte ant at center (D) translucent yellow ant at lower left" }, { "from": "gpt", "value": "(C) orange matte ant at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cf16b3a761e9a9fa.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.623, 0.572) (B) (0.009, 0.711) (C) (0.343, 0.558) (D) (0.815, 0.591)" }, { "from": "gpt", "value": "(A) (0.623, 0.572)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3783ca6dc4d49e26.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) blue fuzzy hair at right (B) shiny gold eye at center" }, { "from": "gpt", "value": "(B) shiny gold eye at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/95a30c3a3e8f222e.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at right further to the viewer compared to green leafy bush at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) That is False." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0277f025b3d1841f.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is farthest from the black matte sunglasses at center from the following options: (A) tan fabric baseball cap at upper center (B) yellow matte life vest at center (C) wooden paddle at center (D) smooth gray canoe at center?" }, { "from": "gpt", "value": "(C) wooden paddle at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c1925905339390a3.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of matte blue fabric dress at center and pink satin saree at center in the image provided, where is matte blue fabric dress at center located with respect to pink satin saree at center? (A) left (B) right" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/dba4d184eab70544.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if bare branches at center is positioned below bare branches at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, bare branches at center is below bare branches at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/45fa0fe46f403957.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.826, 0.330) (B) (0.327, 0.580) (C) (0.706, 0.270)" }, { "from": "gpt", "value": "(B) (0.327, 0.580)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/caa2db56b6b008ab.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.094, 0.745) (B) (0.354, 0.520) (C) (0.810, 0.492) (D) (0.517, 0.559)" }, { "from": "gpt", "value": "(C) (0.810, 0.492)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ecb85c5334fc4e1e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.171, 0.523) (B) (0.444, 0.606)" }, { "from": "gpt", "value": "(A) (0.171, 0.523)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6bea7a0d6a5f6b18.jpg", "conversations": [ { "from": "human", "value": "\nIs gray metallic water at center wider than rusty metal ship at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, gray metallic water at center is wider than rusty metal ship at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/85a6968133f6201c.jpg", "conversations": [ { "from": "human", "value": "\nIs white bread at left below green leafy at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b36b3da0cad5cff0.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the silver metallic laptop at left? (A) white wooden door at center (B) wooden cabinet at right" }, { "from": "gpt", "value": "(A) white wooden door at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c6eaad5af5acc9ca.jpg", "conversations": [ { "from": "human", "value": "\nDoes green grass at center have a smaller size compared to spotted brown giraffe at left? (A) no (B) yes" }, { "from": "gpt", "value": "(A) Actually, green grass at center might be larger than spotted brown giraffe at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ad587cb3cd2c9bf7.jpg", "conversations": [ { "from": "human", "value": "\nDoes green grassy field at lower center have a larger size compared to metallic silver helicopter at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, green grassy field at lower center is larger in size than metallic silver helicopter at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f34804e5fc3a5389.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of clear water at lower left in relation to white glossy ferry at center-right? (A) above (B) below" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/09146cba8ccf04d5.jpg", "conversations": [ { "from": "human", "value": "\nWhich of these objects: (A) clear water at center (B) brown fur deer at center, is positioned farthest from the brown matte/deer at center?" }, { "from": "gpt", "value": "(A) clear water at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0a7ac4f572a33d0e.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is nearest to the camera? (A) dark brown textured trunk at center (B) dark brown bark at upper left" }, { "from": "gpt", "value": "(A) dark brown textured trunk at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b196001fb176d5dd.jpg", "conversations": [ { "from": "human", "value": "\nDoes white lace tablecloth at center come in front of yellow creamy cake at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, white lace tablecloth at center is in front of yellow creamy cake at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1d1b527d57cfa2b3.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue fabric couch at center have a smaller size compared to brown leather jacket at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, blue fabric couch at center is smaller than brown leather jacket at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/94b4be144c65599b.jpg", "conversations": [ { "from": "human", "value": "\nIs matte dark red canoe at center bigger than matte red canoe at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/314aff9a5973db47.jpg", "conversations": [ { "from": "human", "value": "\nWhich is farther from the purple floral fabric dress at center? (A) blue plaid shirt at lower left (B) beige stone stairs at center" }, { "from": "gpt", "value": "(A) blue plaid shirt at lower left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/801940c781d35656.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black backpack at center to the left of dark gray t-shirt at center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, you'll find matte black backpack at center to the left of dark gray t-shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e3fa3577c952ffbd.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.198, 0.487) (B) (0.988, 0.411) (C) (0.427, 0.911)" }, { "from": "gpt", "value": "(A) (0.198, 0.487)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/11f742f063279699.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if denim jacket at center is positioned to the right of brown leather jacket at upper right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, denim jacket at center is not on the right side of brown leather jacket at upper right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5002f2c1304c4dd3.jpg", "conversations": [ { "from": "human", "value": "\nAmong these points, which one is farthest from the camera? (A) (0.331, 0.259) (B) (0.775, 0.277) (C) (0.151, 0.659)" }, { "from": "gpt", "value": "(A) (0.331, 0.259)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d7b3bda030295a88.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if satin black monitor at center is bigger than blue glossy screen at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/269d38649cf211e8.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white fabric at upper right is thinner than shiny gold statue at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9858c8edf50cdfe7.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown fur hyaena at center is bigger than green grass at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, brown fur hyaena at center is larger in size than green grass at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/509bf2e919ced9bb.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.631, 0.641) (B) (0.351, 0.942)" }, { "from": "gpt", "value": "(A) (0.631, 0.641)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/100d7e84809d6c2b.jpg", "conversations": [ { "from": "human", "value": "\nIs green leafy tree at center closer to the viewer compared to transparent text at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, green leafy tree at center is further to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/630d1855afe315bf.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the brown matte window at upper left? (A) white glossy countertop at lower left (B) satin nickel faucet at sink left" }, { "from": "gpt", "value": "(B) satin nickel faucet at sink left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ea8e292f0cc422c1.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) green leafy branch at center (B) gray matte bird at center" }, { "from": "gpt", "value": "(A) green leafy branch at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8e53f8e393eca59.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if rusty brick wall at right is wider than brown dirt path at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, rusty brick wall at right is not wider than brown dirt path at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2aea93c5414e8ca8.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) smooth metal train track at center (B) silver metallic train at center" }, { "from": "gpt", "value": "(A) smooth metal train track at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a3e514cca0af0da.jpg", "conversations": [ { "from": "human", "value": "\nWhich is nearer to the embroidered cotton skirt at center? (A) embroidered velvet skirt at center (B) green satin apron at center (C) matte orange skirt at left" }, { "from": "gpt", "value": "(A) embroidered velvet skirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d4433ff86cf66407.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) matte black jacket at left (B) golden crumbly cookie at upper center (C) golden crumbly biscuit at center" }, { "from": "gpt", "value": "(C) golden crumbly biscuit at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/62c1cd79dbaee478.jpg", "conversations": [ { "from": "human", "value": "\nDoes white cotton shirt at center lie behind smooth purple blouse at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, white cotton shirt at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2b1f9229556878d7.jpg", "conversations": [ { "from": "human", "value": "\nIs brown matte/deer at right to the left of brown matte/deer at left from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, brown matte/deer at right is to the right of brown matte/deer at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6df7b19fae858f45.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown suede cloak at center is positioned below matte gold tunic at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, brown suede cloak at center is below matte gold tunic at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0ba937fe80c8137f.jpg", "conversations": [ { "from": "human", "value": "\nIs silhouette figure at right wider than dark reflective water at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8a58afecf996b41f.jpg", "conversations": [ { "from": "human", "value": "\nDoes matte black swing at center have a greater width compared to transparent plastic goggles at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/e8273ac2e6369d2a.jpg", "conversations": [ { "from": "human", "value": "\nBased on their relative distances, which object is nearer to the pink polka dot swimsuit at center? Choose from: (A) smooth skin children at center (B) multicolored woven bag at upper left" }, { "from": "gpt", "value": "(A) smooth skin children at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/00247905d60ab179.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) white matte shirt at center (B) white matte hat at lower center (C) matte white umbrella at center" }, { "from": "gpt", "value": "(B) white matte hat at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/53152bfb1f72be32.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if matte blue train carriages at center is positioned to the right of smooth concrete train track at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, matte blue train carriages at center is not on the right side of smooth concrete train track at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ca2ef0bc638c301f.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if white cotton shirt at left is thinner than white shirt at left? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Correct, white cotton shirt at left's width is less than white shirt at left's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/45e93f5e3cec3570.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther from the camera taking this photo? (A) (0.917, 0.675) (B) (0.999, 0.644) (C) (0.314, 0.927)" }, { "from": "gpt", "value": "(B) (0.999, 0.644)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/545ec5018979f798.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.177, 0.519) (B) (0.921, 0.467)" }, { "from": "gpt", "value": "(B) (0.921, 0.467)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/053afe451600ee90.jpg", "conversations": [ { "from": "human", "value": "\nDoes white tile floor at center come in front of blue fabric shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, it is in front of blue fabric shirt at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3e1c6ff2b1933003.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown bark tree at left is positioned to the right of green matte tree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) In fact, brown bark tree at left is to the left of green matte tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d4daba7dddb6d5df.jpg", "conversations": [ { "from": "human", "value": "\nDoes yellow-green leaves at right come behind dirt path at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is in front of dirt path at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7e9aa5e9e300ccdf.jpg", "conversations": [ { "from": "human", "value": "\nIs shiny dark brown horse at center above smooth gray dog at lower right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, shiny dark brown horse at center is located above smooth gray dog at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3850da9418e7f168.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.470, 0.145) (B) (0.537, 0.986) (C) (0.955, 0.692)" }, { "from": "gpt", "value": "(C) (0.955, 0.692)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/96d33b85c2dab129.jpg", "conversations": [ { "from": "human", "value": "\nIs matte black suit at left smaller than dark gray suit at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, matte black suit at left is not smaller in size than dark gray suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/83ab59aaf9014f68.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) white fluffy cloud at upper left (B) bare branches at right" }, { "from": "gpt", "value": "(B) bare branches at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6b78e885b3ae0fd1.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if bark textured tree at right is thinner than green leafy tree at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, bark textured tree at right might be wider than green leafy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/de614bc62f53eeca.jpg", "conversations": [ { "from": "human", "value": "\nIs black glossy bull at lower right positioned at the back of black matte bull at lower right? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, it is in front of black matte bull at lower right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/8614c2ab15a5fd00.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) yellow matte signboard at upper center (B) matte yellow poster at center" }, { "from": "gpt", "value": "(B) matte yellow poster at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/cc050557af3536b5.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of smooth wood mast at center in relation to wooden sailboat at lower left? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/adc65cbc0804eb72.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears closest to the camera in this image? (A) (0.866, 0.597) (B) (0.122, 0.973)" }, { "from": "gpt", "value": "(B) (0.122, 0.973)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c087cb8e333e816f.jpg", "conversations": [ { "from": "human", "value": "\nIs white matte camper van at lower right above matte black car at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/04fa20246b414e6b.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of satin white dress at center and matte gray suit at left in the image provided, where is satin white dress at center located with respect to matte gray suit at left? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5550248c79790d9.jpg", "conversations": [ { "from": "human", "value": "\nDoes black matte helmet at center have a lesser width compared to matte brown sweater at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, black matte helmet at center is thinner than matte brown sweater at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/aeb9641106d72060.jpg", "conversations": [ { "from": "human", "value": "\nIs light blue cotton shirt at left further to camera compared to white paper problems at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ce85c990782fbcb1.jpg", "conversations": [ { "from": "human", "value": "\nIs golden-brown foliage at center thinner than white concrete curb at lower center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Correct, golden-brown foliage at center's width is less than white concrete curb at lower center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/646a50e458ae42d3.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera taking this photo? (A) (0.252, 0.600) (B) (0.283, 0.619)" }, { "from": "gpt", "value": "(B) (0.283, 0.619)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/adfde9d26c417b9d.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) matte black jacket at center (B) white soft sweater at upper left" }, { "from": "gpt", "value": "(A) matte black jacket at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ab71da0b65920fa3.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.697, 0.487) (B) (0.499, 0.759)" }, { "from": "gpt", "value": "(A) (0.697, 0.487)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a9d6b50dd1918418.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the closest to the blue plaid shirt at center? Choose among these: (A) matte white cap at upper center (B) shiny black motorcycle at center (C) pink fabric shirt at center" }, { "from": "gpt", "value": "(C) pink fabric shirt at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/f612f7673ee56397.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of smooth skin man at center more distant than that of light beige shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, smooth skin man at center is closer to the viewer." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/34e3019061738f3e.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is closer to the camera? (A) (0.550, 0.422) (B) (0.394, 0.466)" }, { "from": "gpt", "value": "(B) (0.394, 0.466)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7cdcd8c73c1e7fe7.jpg", "conversations": [ { "from": "human", "value": "\nFrom the image, what is the correct spatial relationship of red matte sweater at center in relation to white creamy pasta at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/ebb8420d88a741b6.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is the farthest from the dark brown leather jacket at center? Choose among these: (A) dark blue jeans at center (B) shiny black car at center (C) green fabric jacket at center" }, { "from": "gpt", "value": "(B) shiny black car at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7df706c357ddf624.jpg", "conversations": [ { "from": "human", "value": "\nIs brown wool coat at center positioned in front of pink plastic goggles at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes, brown wool coat at center is in front of pink plastic goggles at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/4fb6c942f333e4a5.jpg", "conversations": [ { "from": "human", "value": "\nIs black wool suit at center closer to camera compared to red fabric flag at left? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, black wool suit at center is in front of red fabric flag at left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b5f50f1c74eb47a9.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is farther from the camera taking this photo? (A) concrete bridge at center (B) dull brown dirt track at center" }, { "from": "gpt", "value": "(A) concrete bridge at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c0cde6d19617fb98.jpg", "conversations": [ { "from": "human", "value": "\nWhere is dark blue uniform at center located in relation to matte blue shirt at center in the image? (A) left (B) right" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/813cfe267deac1aa.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the closest to the observer? (A) (0.420, 0.678) (B) (0.216, 0.366) (C) (0.190, 0.266)" }, { "from": "gpt", "value": "(A) (0.420, 0.678)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c3daa03ba30865c6.jpg", "conversations": [ { "from": "human", "value": "\nIs wooden picture frame at upper left to the left of wooden frame at upper center from the viewer's perspective? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, wooden picture frame at upper left is to the left of wooden frame at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/747313e0a5f8a32a.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of white sand beach at center less distant than that of white matte boat at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5dd1a1932e926983.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if bare branches at center is positioned to the left of shiny black car at lower left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, bare branches at center is not to the left of shiny black car at lower left." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/1f8e5d2aebce16ec.jpg", "conversations": [ { "from": "human", "value": "\nWhich object appears farthest from the camera in this image? (A) reddish-pink fabric shorts at center (B) blue fabric shorts at right" }, { "from": "gpt", "value": "(B) blue fabric shorts at right" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/73610ee2a2255b81.jpg", "conversations": [ { "from": "human", "value": "\nWhich point is farther to the camera? (A) (0.417, 0.261) (B) (0.303, 0.994)" }, { "from": "gpt", "value": "(A) (0.417, 0.261)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/80a53889d27634ed.jpg", "conversations": [ { "from": "human", "value": "\nIs green grassy hillside at upper center bigger than wooden hut at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, green grassy hillside at upper center has a larger size compared to wooden hut at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5cae8f16900ce654.jpg", "conversations": [ { "from": "human", "value": "\nWhich point appears farthest from the camera in this image? (A) (0.810, 0.522) (B) (0.918, 0.898) (C) (0.662, 0.625) (D) (0.376, 0.891)" }, { "from": "gpt", "value": "(A) (0.810, 0.522)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/6632c89ccd0d1274.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is matte red dress at left located relative to matte red dress at center? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/29eaa561d3a85367.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte shirt at center appear on the left side of brown leather belt at lower center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white matte shirt at center is not on the left side of brown leather belt at lower center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/37e281c235eb6311.jpg", "conversations": [ { "from": "human", "value": "\nIs floral fabric headscarf at right positioned before white cotton shirt at right? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, floral fabric headscarf at right is in front of white cotton shirt at right." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c47c8373bf28bc62.jpg", "conversations": [ { "from": "human", "value": "\nIn this image, where is smooth stone alley at center located relative to brown fabric table at lower left? (A) below (B) above" }, { "from": "gpt", "value": "(A)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/48867f8014900bc4.jpg", "conversations": [ { "from": "human", "value": "\nDoes white matte t-shirt at center have a smaller size compared to white cotton shirt at left? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/debb5ff2fda3c33f.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) black matte microphone at center (B) black matte microphone at left (C) clear glass bottle at right (D) black metallic microphone at right" }, { "from": "gpt", "value": "(B) black matte microphone at left" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/a7c87afc0be6065d.jpg", "conversations": [ { "from": "human", "value": "\nWhich of the following is the farthest from the observer? (A) (0.332, 0.231) (B) (0.469, 0.184) (C) (0.170, 0.095)" }, { "from": "gpt", "value": "(C) (0.170, 0.095)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/2986821db6aa77b8.jpg", "conversations": [ { "from": "human", "value": "\nDoes purple textured board shorts at upper right come behind white foam surfboard at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) That is True." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/3710b5a3cc37a380.jpg", "conversations": [ { "from": "human", "value": "\nIs black matte tank top at center positioned behind green fabric chair at right? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, it is not." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/158ca958faeb95de.jpg", "conversations": [ { "from": "human", "value": "\nDoes white fabric umbrella at right have a greater width compared to black matte t-shirt at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, white fabric umbrella at right's width does not surpass black matte t-shirt at center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/0b6bf2fdfd7f6beb.jpg", "conversations": [ { "from": "human", "value": "\nDoes creamy smooth column at left have a smaller size compared to creamy smooth column at right? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/07664e8de0f65309.jpg", "conversations": [ { "from": "human", "value": "\nDoes blue fleece jacket at center have a lesser width compared to light brown textured suit at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) In fact, blue fleece jacket at center might be wider than light brown textured suit at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b1aba603416f3c12.jpg", "conversations": [ { "from": "human", "value": "\nEstimate the real-world distances between objects in this image. Which object is closer to the black plastic bags at lower center? (A) white plastic bag at lower center (B) black metal fence at lower left" }, { "from": "gpt", "value": "(A) white plastic bag at lower center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/9f67a227ceabba16.jpg", "conversations": [ { "from": "human", "value": "\nDoes teal satin dress at center lie in front of black floral dress at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Yes." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/bde7949484101615.jpg", "conversations": [ { "from": "human", "value": "\nCan you confirm if brown textured tree at lower center is thinner than white matte bird at upper center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) Incorrect, brown textured tree at lower center's width is not less than white matte bird at upper center's." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/49fd539ca5dddecc.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the relative positions of matte black suit at center and matte black jacket at left in the image provided, where is matte black suit at center located with respect to matte black jacket at left? (A) below (B) above" }, { "from": "gpt", "value": "(B)" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/b97909ded9a4ab5b.jpg", "conversations": [ { "from": "human", "value": "\nConsidering the real-world distances, which object is closest to the black satin blouse at center from the following options: (A) silky red dress at center (B) silky white blouse at center?" }, { "from": "gpt", "value": "(B) silky white blouse at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/76d71b864bc76f5f.jpg", "conversations": [ { "from": "human", "value": "\nDoes black shiny coat at center appear on the right side of brown shiny coat at center? (A) yes (B) no" }, { "from": "gpt", "value": "(A) Indeed, black shiny coat at center is positioned on the right side of brown shiny coat at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d77b2ad45d6f057b.jpg", "conversations": [ { "from": "human", "value": "\nAmong these objects, which one is farthest from the camera? (A) white matte window sill at lower center (B) black wood window at center" }, { "from": "gpt", "value": "(B) black wood window at center" } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/67fcea118beac868.jpg", "conversations": [ { "from": "human", "value": "\nDoes orange fabric umbrella at center appear on the right side of green mossy tree at center? (A) no (B) yes" }, { "from": "gpt", "value": "(A) No, orange fabric umbrella at center is not to the right of green mossy tree at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/5709b1a0e9f83428.jpg", "conversations": [ { "from": "human", "value": "\nIs black asphalt road at center positioned behind black fur bear at center? (A) yes (B) no" }, { "from": "gpt", "value": "(B) No, black asphalt road at center is in front of black fur bear at center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/7097639b7f14a395.jpg", "conversations": [ { "from": "human", "value": "\nIs the position of matte red electric guitar at center more distant than that of gold brass trumpet at center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Yes, it is." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/d0842662cdca8311.jpg", "conversations": [ { "from": "human", "value": "\nDoes black matte shirt at lower left appear on the left side of white matte person at upper center? (A) no (B) yes" }, { "from": "gpt", "value": "(B) Indeed, black matte shirt at lower left is positioned on the left side of white matte person at upper center." } ] }, { "image": "/data/shared/Qwen/RefSpatial/2D/image/c44644cfd5cf8430.jpg", "conversations": [ { "from": "human", "value": "\nWhich object is closer to the camera taking this photo? (A) dark brown hair at center (B) gray cotton shirt at center (C) curly hair at center" }, { "from": "gpt", "value": "(C) curly hair at center" } ] } ]